Linux Audio

Check our new training course

Loading...
v6.8
   1/*
   2 * Copyright (c) 2004-2007 Voltaire, Inc. All rights reserved.
   3 * Copyright (c) 2005 Intel Corporation.  All rights reserved.
   4 * Copyright (c) 2005 Mellanox Technologies Ltd.  All rights reserved.
   5 * Copyright (c) 2009 HNR Consulting. All rights reserved.
   6 * Copyright (c) 2014,2018 Intel Corporation.  All rights reserved.
   7 *
   8 * This software is available to you under a choice of one of two
   9 * licenses.  You may choose to be licensed under the terms of the GNU
  10 * General Public License (GPL) Version 2, available from the file
  11 * COPYING in the main directory of this source tree, or the
  12 * OpenIB.org BSD license below:
  13 *
  14 *     Redistribution and use in source and binary forms, with or
  15 *     without modification, are permitted provided that the following
  16 *     conditions are met:
  17 *
  18 *      - Redistributions of source code must retain the above
  19 *        copyright notice, this list of conditions and the following
  20 *        disclaimer.
  21 *
  22 *      - Redistributions in binary form must reproduce the above
  23 *        copyright notice, this list of conditions and the following
  24 *        disclaimer in the documentation and/or other materials
  25 *        provided with the distribution.
  26 *
  27 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  28 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  29 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  30 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  31 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  32 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  33 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  34 * SOFTWARE.
  35 *
  36 */
  37
  38#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  39
  40#include <linux/dma-mapping.h>
  41#include <linux/slab.h>
  42#include <linux/module.h>
  43#include <linux/security.h>
  44#include <linux/xarray.h>
  45#include <rdma/ib_cache.h>
  46
  47#include "mad_priv.h"
  48#include "core_priv.h"
  49#include "mad_rmpp.h"
  50#include "smi.h"
  51#include "opa_smi.h"
  52#include "agent.h"
  53
  54#define CREATE_TRACE_POINTS
  55#include <trace/events/ib_mad.h>
  56
  57#ifdef CONFIG_TRACEPOINTS
  58static void create_mad_addr_info(struct ib_mad_send_wr_private *mad_send_wr,
  59			  struct ib_mad_qp_info *qp_info,
  60			  struct trace_event_raw_ib_mad_send_template *entry)
  61{
  62	struct ib_ud_wr *wr = &mad_send_wr->send_wr;
  63	struct rdma_ah_attr attr = {};
  64
  65	rdma_query_ah(wr->ah, &attr);
  66
  67	/* These are common */
  68	entry->sl = attr.sl;
  69	entry->rqpn = wr->remote_qpn;
  70	entry->rqkey = wr->remote_qkey;
  71	entry->dlid = rdma_ah_get_dlid(&attr);
  72}
  73#endif
  74
  75static int mad_sendq_size = IB_MAD_QP_SEND_SIZE;
  76static int mad_recvq_size = IB_MAD_QP_RECV_SIZE;
  77
  78module_param_named(send_queue_size, mad_sendq_size, int, 0444);
  79MODULE_PARM_DESC(send_queue_size, "Size of send queue in number of work requests");
  80module_param_named(recv_queue_size, mad_recvq_size, int, 0444);
  81MODULE_PARM_DESC(recv_queue_size, "Size of receive queue in number of work requests");
  82
  83static DEFINE_XARRAY_ALLOC1(ib_mad_clients);
  84static u32 ib_mad_client_next;
  85static struct list_head ib_mad_port_list;
 
  86
  87/* Port list lock */
  88static DEFINE_SPINLOCK(ib_mad_port_list_lock);
  89
  90/* Forward declarations */
  91static int method_in_use(struct ib_mad_mgmt_method_table **method,
  92			 struct ib_mad_reg_req *mad_reg_req);
  93static void remove_mad_reg_req(struct ib_mad_agent_private *priv);
  94static struct ib_mad_agent_private *find_mad_agent(
  95					struct ib_mad_port_private *port_priv,
  96					const struct ib_mad_hdr *mad);
  97static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
  98				    struct ib_mad_private *mad);
  99static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv);
 100static void timeout_sends(struct work_struct *work);
 101static void local_completions(struct work_struct *work);
 102static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
 103			      struct ib_mad_agent_private *agent_priv,
 104			      u8 mgmt_class);
 105static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
 106			   struct ib_mad_agent_private *agent_priv);
 107static bool ib_mad_send_error(struct ib_mad_port_private *port_priv,
 108			      struct ib_wc *wc);
 109static void ib_mad_send_done(struct ib_cq *cq, struct ib_wc *wc);
 110
 111/*
 112 * Returns a ib_mad_port_private structure or NULL for a device/port
 113 * Assumes ib_mad_port_list_lock is being held
 114 */
 115static inline struct ib_mad_port_private *
 116__ib_get_mad_port(struct ib_device *device, u32 port_num)
 117{
 118	struct ib_mad_port_private *entry;
 119
 120	list_for_each_entry(entry, &ib_mad_port_list, port_list) {
 121		if (entry->device == device && entry->port_num == port_num)
 122			return entry;
 123	}
 124	return NULL;
 125}
 126
 127/*
 128 * Wrapper function to return a ib_mad_port_private structure or NULL
 129 * for a device/port
 130 */
 131static inline struct ib_mad_port_private *
 132ib_get_mad_port(struct ib_device *device, u32 port_num)
 133{
 134	struct ib_mad_port_private *entry;
 135	unsigned long flags;
 136
 137	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
 138	entry = __ib_get_mad_port(device, port_num);
 139	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
 140
 141	return entry;
 142}
 143
 144static inline u8 convert_mgmt_class(u8 mgmt_class)
 145{
 146	/* Alias IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE to 0 */
 147	return mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE ?
 148		0 : mgmt_class;
 149}
 150
 151static int get_spl_qp_index(enum ib_qp_type qp_type)
 152{
 153	switch (qp_type) {
 
 154	case IB_QPT_SMI:
 155		return 0;
 156	case IB_QPT_GSI:
 157		return 1;
 158	default:
 159		return -1;
 160	}
 161}
 162
 163static int vendor_class_index(u8 mgmt_class)
 164{
 165	return mgmt_class - IB_MGMT_CLASS_VENDOR_RANGE2_START;
 166}
 167
 168static int is_vendor_class(u8 mgmt_class)
 169{
 170	if ((mgmt_class < IB_MGMT_CLASS_VENDOR_RANGE2_START) ||
 171	    (mgmt_class > IB_MGMT_CLASS_VENDOR_RANGE2_END))
 172		return 0;
 173	return 1;
 174}
 175
 176static int is_vendor_oui(char *oui)
 177{
 178	if (oui[0] || oui[1] || oui[2])
 179		return 1;
 180	return 0;
 181}
 182
 183static int is_vendor_method_in_use(
 184		struct ib_mad_mgmt_vendor_class *vendor_class,
 185		struct ib_mad_reg_req *mad_reg_req)
 186{
 187	struct ib_mad_mgmt_method_table *method;
 188	int i;
 189
 190	for (i = 0; i < MAX_MGMT_OUI; i++) {
 191		if (!memcmp(vendor_class->oui[i], mad_reg_req->oui, 3)) {
 192			method = vendor_class->method_table[i];
 193			if (method) {
 194				if (method_in_use(&method, mad_reg_req))
 195					return 1;
 196				else
 197					break;
 198			}
 199		}
 200	}
 201	return 0;
 202}
 203
 204int ib_response_mad(const struct ib_mad_hdr *hdr)
 205{
 206	return ((hdr->method & IB_MGMT_METHOD_RESP) ||
 207		(hdr->method == IB_MGMT_METHOD_TRAP_REPRESS) ||
 208		((hdr->mgmt_class == IB_MGMT_CLASS_BM) &&
 209		 (hdr->attr_mod & IB_BM_ATTR_MOD_RESP)));
 210}
 211EXPORT_SYMBOL(ib_response_mad);
 212
 213/*
 214 * ib_register_mad_agent - Register to send/receive MADs
 215 *
 216 * Context: Process context.
 217 */
 218struct ib_mad_agent *ib_register_mad_agent(struct ib_device *device,
 219					   u32 port_num,
 220					   enum ib_qp_type qp_type,
 221					   struct ib_mad_reg_req *mad_reg_req,
 222					   u8 rmpp_version,
 223					   ib_mad_send_handler send_handler,
 224					   ib_mad_recv_handler recv_handler,
 225					   void *context,
 226					   u32 registration_flags)
 227{
 228	struct ib_mad_port_private *port_priv;
 229	struct ib_mad_agent *ret = ERR_PTR(-EINVAL);
 230	struct ib_mad_agent_private *mad_agent_priv;
 231	struct ib_mad_reg_req *reg_req = NULL;
 232	struct ib_mad_mgmt_class_table *class;
 233	struct ib_mad_mgmt_vendor_class_table *vendor;
 234	struct ib_mad_mgmt_vendor_class *vendor_class;
 235	struct ib_mad_mgmt_method_table *method;
 236	int ret2, qpn;
 
 237	u8 mgmt_class, vclass;
 238
 239	if ((qp_type == IB_QPT_SMI && !rdma_cap_ib_smi(device, port_num)) ||
 240	    (qp_type == IB_QPT_GSI && !rdma_cap_ib_cm(device, port_num)))
 241		return ERR_PTR(-EPROTONOSUPPORT);
 242
 243	/* Validate parameters */
 244	qpn = get_spl_qp_index(qp_type);
 245	if (qpn == -1) {
 246		dev_dbg_ratelimited(&device->dev, "%s: invalid QP Type %d\n",
 247				    __func__, qp_type);
 248		goto error1;
 249	}
 250
 251	if (rmpp_version && rmpp_version != IB_MGMT_RMPP_VERSION) {
 252		dev_dbg_ratelimited(&device->dev,
 253				    "%s: invalid RMPP Version %u\n",
 254				    __func__, rmpp_version);
 255		goto error1;
 256	}
 257
 258	/* Validate MAD registration request if supplied */
 259	if (mad_reg_req) {
 260		if (mad_reg_req->mgmt_class_version >= MAX_MGMT_VERSION) {
 261			dev_dbg_ratelimited(&device->dev,
 262					    "%s: invalid Class Version %u\n",
 263					    __func__,
 264					    mad_reg_req->mgmt_class_version);
 265			goto error1;
 266		}
 267		if (!recv_handler) {
 268			dev_dbg_ratelimited(&device->dev,
 269					    "%s: no recv_handler\n", __func__);
 270			goto error1;
 271		}
 272		if (mad_reg_req->mgmt_class >= MAX_MGMT_CLASS) {
 273			/*
 274			 * IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE is the only
 275			 * one in this range currently allowed
 276			 */
 277			if (mad_reg_req->mgmt_class !=
 278			    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
 279				dev_dbg_ratelimited(&device->dev,
 280					"%s: Invalid Mgmt Class 0x%x\n",
 281					__func__, mad_reg_req->mgmt_class);
 282				goto error1;
 283			}
 284		} else if (mad_reg_req->mgmt_class == 0) {
 285			/*
 286			 * Class 0 is reserved in IBA and is used for
 287			 * aliasing of IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE
 288			 */
 289			dev_dbg_ratelimited(&device->dev,
 290					    "%s: Invalid Mgmt Class 0\n",
 291					    __func__);
 292			goto error1;
 293		} else if (is_vendor_class(mad_reg_req->mgmt_class)) {
 294			/*
 295			 * If class is in "new" vendor range,
 296			 * ensure supplied OUI is not zero
 297			 */
 298			if (!is_vendor_oui(mad_reg_req->oui)) {
 299				dev_dbg_ratelimited(&device->dev,
 300					"%s: No OUI specified for class 0x%x\n",
 301					__func__,
 302					mad_reg_req->mgmt_class);
 303				goto error1;
 304			}
 305		}
 306		/* Make sure class supplied is consistent with RMPP */
 307		if (!ib_is_mad_class_rmpp(mad_reg_req->mgmt_class)) {
 308			if (rmpp_version) {
 309				dev_dbg_ratelimited(&device->dev,
 310					"%s: RMPP version for non-RMPP class 0x%x\n",
 311					__func__, mad_reg_req->mgmt_class);
 312				goto error1;
 313			}
 314		}
 315
 316		/* Make sure class supplied is consistent with QP type */
 317		if (qp_type == IB_QPT_SMI) {
 318			if ((mad_reg_req->mgmt_class !=
 319					IB_MGMT_CLASS_SUBN_LID_ROUTED) &&
 320			    (mad_reg_req->mgmt_class !=
 321					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
 322				dev_dbg_ratelimited(&device->dev,
 323					"%s: Invalid SM QP type: class 0x%x\n",
 324					__func__, mad_reg_req->mgmt_class);
 325				goto error1;
 326			}
 327		} else {
 328			if ((mad_reg_req->mgmt_class ==
 329					IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
 330			    (mad_reg_req->mgmt_class ==
 331					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
 332				dev_dbg_ratelimited(&device->dev,
 333					"%s: Invalid GS QP type: class 0x%x\n",
 334					__func__, mad_reg_req->mgmt_class);
 335				goto error1;
 336			}
 337		}
 338	} else {
 339		/* No registration request supplied */
 340		if (!send_handler)
 341			goto error1;
 342		if (registration_flags & IB_MAD_USER_RMPP)
 343			goto error1;
 344	}
 345
 346	/* Validate device and port */
 347	port_priv = ib_get_mad_port(device, port_num);
 348	if (!port_priv) {
 349		dev_dbg_ratelimited(&device->dev, "%s: Invalid port %u\n",
 350				    __func__, port_num);
 351		ret = ERR_PTR(-ENODEV);
 352		goto error1;
 353	}
 354
 355	/* Verify the QP requested is supported. For example, Ethernet devices
 356	 * will not have QP0.
 357	 */
 358	if (!port_priv->qp_info[qpn].qp) {
 359		dev_dbg_ratelimited(&device->dev, "%s: QP %d not supported\n",
 360				    __func__, qpn);
 361		ret = ERR_PTR(-EPROTONOSUPPORT);
 362		goto error1;
 363	}
 364
 365	/* Allocate structures */
 366	mad_agent_priv = kzalloc(sizeof *mad_agent_priv, GFP_KERNEL);
 367	if (!mad_agent_priv) {
 368		ret = ERR_PTR(-ENOMEM);
 369		goto error1;
 370	}
 371
 
 
 
 
 
 
 
 372	if (mad_reg_req) {
 373		reg_req = kmemdup(mad_reg_req, sizeof *reg_req, GFP_KERNEL);
 374		if (!reg_req) {
 375			ret = ERR_PTR(-ENOMEM);
 376			goto error3;
 377		}
 378	}
 379
 380	/* Now, fill in the various structures */
 381	mad_agent_priv->qp_info = &port_priv->qp_info[qpn];
 382	mad_agent_priv->reg_req = reg_req;
 383	mad_agent_priv->agent.rmpp_version = rmpp_version;
 384	mad_agent_priv->agent.device = device;
 385	mad_agent_priv->agent.recv_handler = recv_handler;
 386	mad_agent_priv->agent.send_handler = send_handler;
 387	mad_agent_priv->agent.context = context;
 388	mad_agent_priv->agent.qp = port_priv->qp_info[qpn].qp;
 389	mad_agent_priv->agent.port_num = port_num;
 390	mad_agent_priv->agent.flags = registration_flags;
 391	spin_lock_init(&mad_agent_priv->lock);
 392	INIT_LIST_HEAD(&mad_agent_priv->send_list);
 393	INIT_LIST_HEAD(&mad_agent_priv->wait_list);
 394	INIT_LIST_HEAD(&mad_agent_priv->done_list);
 395	INIT_LIST_HEAD(&mad_agent_priv->rmpp_list);
 396	INIT_DELAYED_WORK(&mad_agent_priv->timed_work, timeout_sends);
 397	INIT_LIST_HEAD(&mad_agent_priv->local_list);
 398	INIT_WORK(&mad_agent_priv->local_work, local_completions);
 399	refcount_set(&mad_agent_priv->refcount, 1);
 400	init_completion(&mad_agent_priv->comp);
 401
 402	ret2 = ib_mad_agent_security_setup(&mad_agent_priv->agent, qp_type);
 403	if (ret2) {
 404		ret = ERR_PTR(ret2);
 405		goto error4;
 406	}
 407
 408	/*
 409	 * The mlx4 driver uses the top byte to distinguish which virtual
 410	 * function generated the MAD, so we must avoid using it.
 411	 */
 412	ret2 = xa_alloc_cyclic(&ib_mad_clients, &mad_agent_priv->agent.hi_tid,
 413			mad_agent_priv, XA_LIMIT(0, (1 << 24) - 1),
 414			&ib_mad_client_next, GFP_KERNEL);
 415	if (ret2 < 0) {
 416		ret = ERR_PTR(ret2);
 417		goto error5;
 418	}
 419
 420	/*
 421	 * Make sure MAD registration (if supplied)
 422	 * is non overlapping with any existing ones
 423	 */
 424	spin_lock_irq(&port_priv->reg_lock);
 425	if (mad_reg_req) {
 426		mgmt_class = convert_mgmt_class(mad_reg_req->mgmt_class);
 427		if (!is_vendor_class(mgmt_class)) {
 428			class = port_priv->version[mad_reg_req->
 429						   mgmt_class_version].class;
 430			if (class) {
 431				method = class->method_table[mgmt_class];
 432				if (method) {
 433					if (method_in_use(&method,
 434							   mad_reg_req))
 435						goto error6;
 436				}
 437			}
 438			ret2 = add_nonoui_reg_req(mad_reg_req, mad_agent_priv,
 439						  mgmt_class);
 440		} else {
 441			/* "New" vendor class range */
 442			vendor = port_priv->version[mad_reg_req->
 443						    mgmt_class_version].vendor;
 444			if (vendor) {
 445				vclass = vendor_class_index(mgmt_class);
 446				vendor_class = vendor->vendor_class[vclass];
 447				if (vendor_class) {
 448					if (is_vendor_method_in_use(
 449							vendor_class,
 450							mad_reg_req))
 451						goto error6;
 452				}
 453			}
 454			ret2 = add_oui_reg_req(mad_reg_req, mad_agent_priv);
 455		}
 456		if (ret2) {
 457			ret = ERR_PTR(ret2);
 458			goto error6;
 459		}
 460	}
 461	spin_unlock_irq(&port_priv->reg_lock);
 462
 463	trace_ib_mad_create_agent(mad_agent_priv);
 
 
 
 464	return &mad_agent_priv->agent;
 465error6:
 466	spin_unlock_irq(&port_priv->reg_lock);
 467	xa_erase(&ib_mad_clients, mad_agent_priv->agent.hi_tid);
 468error5:
 469	ib_mad_agent_security_cleanup(&mad_agent_priv->agent);
 470error4:
 
 471	kfree(reg_req);
 472error3:
 
 
 473	kfree(mad_agent_priv);
 474error1:
 475	return ret;
 476}
 477EXPORT_SYMBOL(ib_register_mad_agent);
 478
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 479static inline void deref_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 480{
 481	if (refcount_dec_and_test(&mad_agent_priv->refcount))
 482		complete(&mad_agent_priv->comp);
 483}
 484
 
 
 
 
 
 
 485static void unregister_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 486{
 487	struct ib_mad_port_private *port_priv;
 
 488
 489	/* Note that we could still be handling received MADs */
 490	trace_ib_mad_unregister_agent(mad_agent_priv);
 491
 492	/*
 493	 * Canceling all sends results in dropping received response
 494	 * MADs, preventing us from queuing additional work
 495	 */
 496	cancel_mads(mad_agent_priv);
 497	port_priv = mad_agent_priv->qp_info->port_priv;
 498	cancel_delayed_work(&mad_agent_priv->timed_work);
 499
 500	spin_lock_irq(&port_priv->reg_lock);
 501	remove_mad_reg_req(mad_agent_priv);
 502	spin_unlock_irq(&port_priv->reg_lock);
 503	xa_erase(&ib_mad_clients, mad_agent_priv->agent.hi_tid);
 504
 505	flush_workqueue(port_priv->wq);
 
 506
 507	deref_mad_agent(mad_agent_priv);
 508	wait_for_completion(&mad_agent_priv->comp);
 509	ib_cancel_rmpp_recvs(mad_agent_priv);
 510
 511	ib_mad_agent_security_cleanup(&mad_agent_priv->agent);
 512
 513	kfree(mad_agent_priv->reg_req);
 514	kfree_rcu(mad_agent_priv, rcu);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 515}
 516
 517/*
 518 * ib_unregister_mad_agent - Unregisters a client from using MAD services
 519 *
 520 * Context: Process context.
 521 */
 522void ib_unregister_mad_agent(struct ib_mad_agent *mad_agent)
 523{
 524	struct ib_mad_agent_private *mad_agent_priv;
 
 525
 526	mad_agent_priv = container_of(mad_agent,
 527				      struct ib_mad_agent_private,
 528				      agent);
 529	unregister_mad_agent(mad_agent_priv);
 
 
 
 
 
 
 
 
 
 530}
 531EXPORT_SYMBOL(ib_unregister_mad_agent);
 532
 533static void dequeue_mad(struct ib_mad_list_head *mad_list)
 534{
 535	struct ib_mad_queue *mad_queue;
 536	unsigned long flags;
 537
 
 538	mad_queue = mad_list->mad_queue;
 539	spin_lock_irqsave(&mad_queue->lock, flags);
 540	list_del(&mad_list->list);
 541	mad_queue->count--;
 542	spin_unlock_irqrestore(&mad_queue->lock, flags);
 543}
 544
 545static void build_smp_wc(struct ib_qp *qp, struct ib_cqe *cqe, u16 slid,
 546		u16 pkey_index, u32 port_num, struct ib_wc *wc)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 547{
 548	memset(wc, 0, sizeof *wc);
 549	wc->wr_cqe = cqe;
 550	wc->status = IB_WC_SUCCESS;
 551	wc->opcode = IB_WC_RECV;
 552	wc->pkey_index = pkey_index;
 553	wc->byte_len = sizeof(struct ib_mad) + sizeof(struct ib_grh);
 554	wc->src_qp = IB_QP0;
 555	wc->qp = qp;
 556	wc->slid = slid;
 557	wc->sl = 0;
 558	wc->dlid_path_bits = 0;
 559	wc->port_num = port_num;
 560}
 561
 562static size_t mad_priv_size(const struct ib_mad_private *mp)
 563{
 564	return sizeof(struct ib_mad_private) + mp->mad_size;
 565}
 566
 567static struct ib_mad_private *alloc_mad_private(size_t mad_size, gfp_t flags)
 568{
 569	size_t size = sizeof(struct ib_mad_private) + mad_size;
 570	struct ib_mad_private *ret = kzalloc(size, flags);
 571
 572	if (ret)
 573		ret->mad_size = mad_size;
 574
 575	return ret;
 576}
 577
 578static size_t port_mad_size(const struct ib_mad_port_private *port_priv)
 579{
 580	return rdma_max_mad_size(port_priv->device, port_priv->port_num);
 581}
 582
 583static size_t mad_priv_dma_size(const struct ib_mad_private *mp)
 584{
 585	return sizeof(struct ib_grh) + mp->mad_size;
 586}
 587
 588/*
 589 * Return 0 if SMP is to be sent
 590 * Return 1 if SMP was consumed locally (whether or not solicited)
 591 * Return < 0 if error
 592 */
 593static int handle_outgoing_dr_smp(struct ib_mad_agent_private *mad_agent_priv,
 594				  struct ib_mad_send_wr_private *mad_send_wr)
 595{
 596	int ret = 0;
 597	struct ib_smp *smp = mad_send_wr->send_buf.mad;
 598	struct opa_smp *opa_smp = (struct opa_smp *)smp;
 599	unsigned long flags;
 600	struct ib_mad_local_private *local;
 601	struct ib_mad_private *mad_priv;
 602	struct ib_mad_port_private *port_priv;
 603	struct ib_mad_agent_private *recv_mad_agent = NULL;
 604	struct ib_device *device = mad_agent_priv->agent.device;
 605	u32 port_num;
 606	struct ib_wc mad_wc;
 607	struct ib_ud_wr *send_wr = &mad_send_wr->send_wr;
 608	size_t mad_size = port_mad_size(mad_agent_priv->qp_info->port_priv);
 609	u16 out_mad_pkey_index = 0;
 610	u16 drslid;
 611	bool opa = rdma_cap_opa_mad(mad_agent_priv->qp_info->port_priv->device,
 612				    mad_agent_priv->qp_info->port_priv->port_num);
 613
 614	if (rdma_cap_ib_switch(device) &&
 615	    smp->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
 616		port_num = send_wr->port_num;
 617	else
 618		port_num = mad_agent_priv->agent.port_num;
 619
 620	/*
 621	 * Directed route handling starts if the initial LID routed part of
 622	 * a request or the ending LID routed part of a response is empty.
 623	 * If we are at the start of the LID routed part, don't update the
 624	 * hop_ptr or hop_cnt.  See section 14.2.2, Vol 1 IB spec.
 625	 */
 626	if (opa && smp->class_version == OPA_SM_CLASS_VERSION) {
 627		u32 opa_drslid;
 628
 629		trace_ib_mad_handle_out_opa_smi(opa_smp);
 630
 631		if ((opa_get_smp_direction(opa_smp)
 632		     ? opa_smp->route.dr.dr_dlid : opa_smp->route.dr.dr_slid) ==
 633		     OPA_LID_PERMISSIVE &&
 634		     opa_smi_handle_dr_smp_send(opa_smp,
 635						rdma_cap_ib_switch(device),
 636						port_num) == IB_SMI_DISCARD) {
 637			ret = -EINVAL;
 638			dev_err(&device->dev, "OPA Invalid directed route\n");
 639			goto out;
 640		}
 641		opa_drslid = be32_to_cpu(opa_smp->route.dr.dr_slid);
 642		if (opa_drslid != be32_to_cpu(OPA_LID_PERMISSIVE) &&
 643		    opa_drslid & 0xffff0000) {
 644			ret = -EINVAL;
 645			dev_err(&device->dev, "OPA Invalid dr_slid 0x%x\n",
 646			       opa_drslid);
 647			goto out;
 648		}
 649		drslid = (u16)(opa_drslid & 0x0000ffff);
 650
 651		/* Check to post send on QP or process locally */
 652		if (opa_smi_check_local_smp(opa_smp, device) == IB_SMI_DISCARD &&
 653		    opa_smi_check_local_returning_smp(opa_smp, device) == IB_SMI_DISCARD)
 654			goto out;
 655	} else {
 656		trace_ib_mad_handle_out_ib_smi(smp);
 657
 658		if ((ib_get_smp_direction(smp) ? smp->dr_dlid : smp->dr_slid) ==
 659		     IB_LID_PERMISSIVE &&
 660		     smi_handle_dr_smp_send(smp, rdma_cap_ib_switch(device), port_num) ==
 661		     IB_SMI_DISCARD) {
 662			ret = -EINVAL;
 663			dev_err(&device->dev, "Invalid directed route\n");
 664			goto out;
 665		}
 666		drslid = be16_to_cpu(smp->dr_slid);
 667
 668		/* Check to post send on QP or process locally */
 669		if (smi_check_local_smp(smp, device) == IB_SMI_DISCARD &&
 670		    smi_check_local_returning_smp(smp, device) == IB_SMI_DISCARD)
 671			goto out;
 672	}
 673
 
 
 
 
 
 674	local = kmalloc(sizeof *local, GFP_ATOMIC);
 675	if (!local) {
 676		ret = -ENOMEM;
 
 677		goto out;
 678	}
 679	local->mad_priv = NULL;
 680	local->recv_mad_agent = NULL;
 681	mad_priv = alloc_mad_private(mad_size, GFP_ATOMIC);
 682	if (!mad_priv) {
 683		ret = -ENOMEM;
 
 684		kfree(local);
 685		goto out;
 686	}
 687
 688	build_smp_wc(mad_agent_priv->agent.qp,
 689		     send_wr->wr.wr_cqe, drslid,
 690		     send_wr->pkey_index,
 691		     send_wr->port_num, &mad_wc);
 692
 693	if (opa && smp->base_version == OPA_MGMT_BASE_VERSION) {
 694		mad_wc.byte_len = mad_send_wr->send_buf.hdr_len
 695					+ mad_send_wr->send_buf.data_len
 696					+ sizeof(struct ib_grh);
 697	}
 698
 699	/* No GRH for DR SMP */
 700	ret = device->ops.process_mad(device, 0, port_num, &mad_wc, NULL,
 701				      (const struct ib_mad *)smp,
 702				      (struct ib_mad *)mad_priv->mad, &mad_size,
 703				      &out_mad_pkey_index);
 704	switch (ret) {
 705	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_REPLY:
 706		if (ib_response_mad((const struct ib_mad_hdr *)mad_priv->mad) &&
 707		    mad_agent_priv->agent.recv_handler) {
 708			local->mad_priv = mad_priv;
 709			local->recv_mad_agent = mad_agent_priv;
 710			/*
 711			 * Reference MAD agent until receive
 712			 * side of local completion handled
 713			 */
 714			refcount_inc(&mad_agent_priv->refcount);
 715		} else
 716			kfree(mad_priv);
 717		break;
 718	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_CONSUMED:
 719		kfree(mad_priv);
 720		break;
 721	case IB_MAD_RESULT_SUCCESS:
 722		/* Treat like an incoming receive MAD */
 723		port_priv = ib_get_mad_port(mad_agent_priv->agent.device,
 724					    mad_agent_priv->agent.port_num);
 725		if (port_priv) {
 726			memcpy(mad_priv->mad, smp, mad_priv->mad_size);
 727			recv_mad_agent = find_mad_agent(port_priv,
 728						        (const struct ib_mad_hdr *)mad_priv->mad);
 729		}
 730		if (!port_priv || !recv_mad_agent) {
 731			/*
 732			 * No receiving agent so drop packet and
 733			 * generate send completion.
 734			 */
 735			kfree(mad_priv);
 736			break;
 737		}
 738		local->mad_priv = mad_priv;
 739		local->recv_mad_agent = recv_mad_agent;
 740		break;
 741	default:
 742		kfree(mad_priv);
 743		kfree(local);
 744		ret = -EINVAL;
 745		goto out;
 746	}
 747
 748	local->mad_send_wr = mad_send_wr;
 749	if (opa) {
 750		local->mad_send_wr->send_wr.pkey_index = out_mad_pkey_index;
 751		local->return_wc_byte_len = mad_size;
 752	}
 753	/* Reference MAD agent until send side of local completion handled */
 754	refcount_inc(&mad_agent_priv->refcount);
 755	/* Queue local completion to local list */
 756	spin_lock_irqsave(&mad_agent_priv->lock, flags);
 757	list_add_tail(&local->completion_list, &mad_agent_priv->local_list);
 758	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
 759	queue_work(mad_agent_priv->qp_info->port_priv->wq,
 760		   &mad_agent_priv->local_work);
 761	ret = 1;
 762out:
 763	return ret;
 764}
 765
 766static int get_pad_size(int hdr_len, int data_len, size_t mad_size)
 767{
 768	int seg_size, pad;
 769
 770	seg_size = mad_size - hdr_len;
 771	if (data_len && seg_size) {
 772		pad = seg_size - data_len % seg_size;
 773		return pad == seg_size ? 0 : pad;
 774	} else
 775		return seg_size;
 776}
 777
 778static void free_send_rmpp_list(struct ib_mad_send_wr_private *mad_send_wr)
 779{
 780	struct ib_rmpp_segment *s, *t;
 781
 782	list_for_each_entry_safe(s, t, &mad_send_wr->rmpp_list, list) {
 783		list_del(&s->list);
 784		kfree(s);
 785	}
 786}
 787
 788static int alloc_send_rmpp_list(struct ib_mad_send_wr_private *send_wr,
 789				size_t mad_size, gfp_t gfp_mask)
 790{
 791	struct ib_mad_send_buf *send_buf = &send_wr->send_buf;
 792	struct ib_rmpp_mad *rmpp_mad = send_buf->mad;
 793	struct ib_rmpp_segment *seg = NULL;
 794	int left, seg_size, pad;
 795
 796	send_buf->seg_size = mad_size - send_buf->hdr_len;
 797	send_buf->seg_rmpp_size = mad_size - IB_MGMT_RMPP_HDR;
 798	seg_size = send_buf->seg_size;
 799	pad = send_wr->pad;
 800
 801	/* Allocate data segments. */
 802	for (left = send_buf->data_len + pad; left > 0; left -= seg_size) {
 803		seg = kmalloc(sizeof(*seg) + seg_size, gfp_mask);
 804		if (!seg) {
 
 
 
 805			free_send_rmpp_list(send_wr);
 806			return -ENOMEM;
 807		}
 808		seg->num = ++send_buf->seg_count;
 809		list_add_tail(&seg->list, &send_wr->rmpp_list);
 810	}
 811
 812	/* Zero any padding */
 813	if (pad)
 814		memset(seg->data + seg_size - pad, 0, pad);
 815
 816	rmpp_mad->rmpp_hdr.rmpp_version = send_wr->mad_agent_priv->
 817					  agent.rmpp_version;
 818	rmpp_mad->rmpp_hdr.rmpp_type = IB_MGMT_RMPP_TYPE_DATA;
 819	ib_set_rmpp_flags(&rmpp_mad->rmpp_hdr, IB_MGMT_RMPP_FLAG_ACTIVE);
 820
 821	send_wr->cur_seg = container_of(send_wr->rmpp_list.next,
 822					struct ib_rmpp_segment, list);
 823	send_wr->last_ack_seg = send_wr->cur_seg;
 824	return 0;
 825}
 826
 827int ib_mad_kernel_rmpp_agent(const struct ib_mad_agent *agent)
 828{
 829	return agent->rmpp_version && !(agent->flags & IB_MAD_USER_RMPP);
 830}
 831EXPORT_SYMBOL(ib_mad_kernel_rmpp_agent);
 832
 833struct ib_mad_send_buf *ib_create_send_mad(struct ib_mad_agent *mad_agent,
 834					   u32 remote_qpn, u16 pkey_index,
 835					   int rmpp_active, int hdr_len,
 836					   int data_len, gfp_t gfp_mask,
 837					   u8 base_version)
 838{
 839	struct ib_mad_agent_private *mad_agent_priv;
 840	struct ib_mad_send_wr_private *mad_send_wr;
 841	int pad, message_size, ret, size;
 842	void *buf;
 843	size_t mad_size;
 844	bool opa;
 845
 846	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
 847				      agent);
 848
 849	opa = rdma_cap_opa_mad(mad_agent->device, mad_agent->port_num);
 850
 851	if (opa && base_version == OPA_MGMT_BASE_VERSION)
 852		mad_size = sizeof(struct opa_mad);
 853	else
 854		mad_size = sizeof(struct ib_mad);
 855
 856	pad = get_pad_size(hdr_len, data_len, mad_size);
 857	message_size = hdr_len + data_len + pad;
 858
 859	if (ib_mad_kernel_rmpp_agent(mad_agent)) {
 860		if (!rmpp_active && message_size > mad_size)
 861			return ERR_PTR(-EINVAL);
 862	} else
 863		if (rmpp_active || message_size > mad_size)
 864			return ERR_PTR(-EINVAL);
 865
 866	size = rmpp_active ? hdr_len : mad_size;
 867	buf = kzalloc(sizeof *mad_send_wr + size, gfp_mask);
 868	if (!buf)
 869		return ERR_PTR(-ENOMEM);
 870
 871	mad_send_wr = buf + size;
 872	INIT_LIST_HEAD(&mad_send_wr->rmpp_list);
 873	mad_send_wr->send_buf.mad = buf;
 874	mad_send_wr->send_buf.hdr_len = hdr_len;
 875	mad_send_wr->send_buf.data_len = data_len;
 876	mad_send_wr->pad = pad;
 877
 878	mad_send_wr->mad_agent_priv = mad_agent_priv;
 879	mad_send_wr->sg_list[0].length = hdr_len;
 880	mad_send_wr->sg_list[0].lkey = mad_agent->qp->pd->local_dma_lkey;
 881
 882	/* OPA MADs don't have to be the full 2048 bytes */
 883	if (opa && base_version == OPA_MGMT_BASE_VERSION &&
 884	    data_len < mad_size - hdr_len)
 885		mad_send_wr->sg_list[1].length = data_len;
 886	else
 887		mad_send_wr->sg_list[1].length = mad_size - hdr_len;
 888
 889	mad_send_wr->sg_list[1].lkey = mad_agent->qp->pd->local_dma_lkey;
 890
 891	mad_send_wr->mad_list.cqe.done = ib_mad_send_done;
 892
 893	mad_send_wr->send_wr.wr.wr_cqe = &mad_send_wr->mad_list.cqe;
 894	mad_send_wr->send_wr.wr.sg_list = mad_send_wr->sg_list;
 895	mad_send_wr->send_wr.wr.num_sge = 2;
 896	mad_send_wr->send_wr.wr.opcode = IB_WR_SEND;
 897	mad_send_wr->send_wr.wr.send_flags = IB_SEND_SIGNALED;
 898	mad_send_wr->send_wr.remote_qpn = remote_qpn;
 899	mad_send_wr->send_wr.remote_qkey = IB_QP_SET_QKEY;
 900	mad_send_wr->send_wr.pkey_index = pkey_index;
 901
 902	if (rmpp_active) {
 903		ret = alloc_send_rmpp_list(mad_send_wr, mad_size, gfp_mask);
 904		if (ret) {
 905			kfree(buf);
 906			return ERR_PTR(ret);
 907		}
 908	}
 909
 910	mad_send_wr->send_buf.mad_agent = mad_agent;
 911	refcount_inc(&mad_agent_priv->refcount);
 912	return &mad_send_wr->send_buf;
 913}
 914EXPORT_SYMBOL(ib_create_send_mad);
 915
 916int ib_get_mad_data_offset(u8 mgmt_class)
 917{
 918	if (mgmt_class == IB_MGMT_CLASS_SUBN_ADM)
 919		return IB_MGMT_SA_HDR;
 920	else if ((mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
 921		 (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
 922		 (mgmt_class == IB_MGMT_CLASS_BIS))
 923		return IB_MGMT_DEVICE_HDR;
 924	else if ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
 925		 (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END))
 926		return IB_MGMT_VENDOR_HDR;
 927	else
 928		return IB_MGMT_MAD_HDR;
 929}
 930EXPORT_SYMBOL(ib_get_mad_data_offset);
 931
 932int ib_is_mad_class_rmpp(u8 mgmt_class)
 933{
 934	if ((mgmt_class == IB_MGMT_CLASS_SUBN_ADM) ||
 935	    (mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
 936	    (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
 937	    (mgmt_class == IB_MGMT_CLASS_BIS) ||
 938	    ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
 939	     (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END)))
 940		return 1;
 941	return 0;
 942}
 943EXPORT_SYMBOL(ib_is_mad_class_rmpp);
 944
/*
 * ib_get_rmpp_segment - Return the data pointer of segment @seg_num of a
 * send buffer.
 * @send_buf: send buffer embedded in a struct ib_mad_send_wr_private
 * @seg_num: number of the segment to look up
 *
 * The search starts at the cached cur_seg.  The list is walked forward when
 * @seg_num is larger than cur_seg->num and backward when it is smaller; when
 * they are equal no walk is needed.  cur_seg itself is the loop cursor, so
 * on return it points at whatever entry the walk stopped on.
 *
 * NOTE(review): the walk has no "not found" handling - if no entry carries
 * @seg_num the cursor ends up on the iteration head rather than on a real
 * segment.  Callers presumably only ask for segments that exist; confirm.
 */
void *ib_get_rmpp_segment(struct ib_mad_send_buf *send_buf, int seg_num)
{
	struct ib_mad_send_wr_private *mad_send_wr;
	struct list_head *list;

	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
				   send_buf);
	/* The starting segment's own node serves as the iteration head */
	list = &mad_send_wr->cur_seg->list;

	if (mad_send_wr->cur_seg->num < seg_num) {
		/* Target lies after the cached segment: walk forward */
		list_for_each_entry(mad_send_wr->cur_seg, list, list)
			if (mad_send_wr->cur_seg->num == seg_num)
				break;
	} else if (mad_send_wr->cur_seg->num > seg_num) {
		/* Target lies before the cached segment: walk backward */
		list_for_each_entry_reverse(mad_send_wr->cur_seg, list, list)
			if (mad_send_wr->cur_seg->num == seg_num)
				break;
	}
	return mad_send_wr->cur_seg->data;
}
EXPORT_SYMBOL(ib_get_rmpp_segment);
 966
 967static inline void *ib_get_payload(struct ib_mad_send_wr_private *mad_send_wr)
 968{
 969	if (mad_send_wr->send_buf.seg_count)
 970		return ib_get_rmpp_segment(&mad_send_wr->send_buf,
 971					   mad_send_wr->seg_num);
 972	else
 973		return mad_send_wr->send_buf.mad +
 974		       mad_send_wr->send_buf.hdr_len;
 975}
 976
 977void ib_free_send_mad(struct ib_mad_send_buf *send_buf)
 978{
 979	struct ib_mad_agent_private *mad_agent_priv;
 980	struct ib_mad_send_wr_private *mad_send_wr;
 981
 982	mad_agent_priv = container_of(send_buf->mad_agent,
 983				      struct ib_mad_agent_private, agent);
 984	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
 985				   send_buf);
 986
 987	free_send_rmpp_list(mad_send_wr);
 988	kfree(send_buf->mad);
 989	deref_mad_agent(mad_agent_priv);
 990}
 991EXPORT_SYMBOL(ib_free_send_mad);
 992
/*
 * ib_send_mad - DMA-map a prepared send work request and either post it to
 * the QP or park it on the overflow list.
 * @mad_send_wr: send work request to transmit
 *
 * sg_list[0] is mapped from the start of the MAD buffer and sg_list[1] from
 * the payload returned by ib_get_payload(); both lengths must already be set
 * in the scatter/gather entries.
 *
 * Returns 0 when the request was posted or queued on the overflow list,
 * -ENOMEM when either DMA mapping fails, or the error from ib_post_send().
 * On any failure both mappings have been released again.
 */
int ib_send_mad(struct ib_mad_send_wr_private *mad_send_wr)
{
	struct ib_mad_qp_info *qp_info;
	struct list_head *list;
	struct ib_mad_agent *mad_agent;
	struct ib_sge *sge;
	unsigned long flags;
	int ret;

	/* Set WR ID to find mad_send_wr upon completion */
	qp_info = mad_send_wr->mad_agent_priv->qp_info;
	mad_send_wr->mad_list.mad_queue = &qp_info->send_queue;
	mad_send_wr->mad_list.cqe.done = ib_mad_send_done;
	mad_send_wr->send_wr.wr.wr_cqe = &mad_send_wr->mad_list.cqe;

	mad_agent = mad_send_wr->send_buf.mad_agent;
	sge = mad_send_wr->sg_list;
	/* Map the header part of the MAD */
	sge[0].addr = ib_dma_map_single(mad_agent->device,
					mad_send_wr->send_buf.mad,
					sge[0].length,
					DMA_TO_DEVICE);
	if (unlikely(ib_dma_mapping_error(mad_agent->device, sge[0].addr)))
		return -ENOMEM;

	/* Remember the mapping so it can be undone later */
	mad_send_wr->header_mapping = sge[0].addr;

	/* Map the payload part of the MAD */
	sge[1].addr = ib_dma_map_single(mad_agent->device,
					ib_get_payload(mad_send_wr),
					sge[1].length,
					DMA_TO_DEVICE);
	if (unlikely(ib_dma_mapping_error(mad_agent->device, sge[1].addr))) {
		/* Payload mapping failed: undo the header mapping */
		ib_dma_unmap_single(mad_agent->device,
				    mad_send_wr->header_mapping,
				    sge[0].length, DMA_TO_DEVICE);
		return -ENOMEM;
	}
	mad_send_wr->payload_mapping = sge[1].addr;

	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
	if (qp_info->send_queue.count < qp_info->send_queue.max_active) {
		/* Room on the send queue: hand the request to the QP now */
		trace_ib_mad_ib_send_mad(mad_send_wr, qp_info);
		ret = ib_post_send(mad_agent->qp, &mad_send_wr->send_wr.wr,
				   NULL);
		list = &qp_info->send_queue.list;
	} else {
		/* Send queue is full: defer by queueing on the overflow list */
		ret = 0;
		list = &qp_info->overflow_list;
	}

	if (!ret) {
		/* The count covers overflow entries as well as posted ones */
		qp_info->send_queue.count++;
		list_add_tail(&mad_send_wr->mad_list.list, list);
	}
	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
	if (ret) {
		/* Posting failed: release both DMA mappings */
		ib_dma_unmap_single(mad_agent->device,
				    mad_send_wr->header_mapping,
				    sge[0].length, DMA_TO_DEVICE);
		ib_dma_unmap_single(mad_agent->device,
				    mad_send_wr->payload_mapping,
				    sge[1].length, DMA_TO_DEVICE);
	}
	return ret;
}
1057
/*
 * ib_post_send_mad - Posts MAD(s) to the send queue of the QP associated
 *  with the registered client
 * @send_buf: first buffer of a chain linked through ->next
 * @bad_send_buf: optional; on failure receives the buffer that could not be
 *  posted
 *
 * Each buffer in the chain is validated, added to the agent's send_list and
 * then sent, through the RMPP layer first when the agent uses kernel RMPP.
 * Processing stops at the first failure.
 *
 * Returns 0 when the whole chain was handled (an empty chain also yields 0)
 * or a negative error code for the first buffer that failed.
 */
int ib_post_send_mad(struct ib_mad_send_buf *send_buf,
		     struct ib_mad_send_buf **bad_send_buf)
{
	struct ib_mad_agent_private *mad_agent_priv;
	struct ib_mad_send_buf *next_send_buf;
	struct ib_mad_send_wr_private *mad_send_wr;
	unsigned long flags;
	int ret = -EINVAL;

	/* Walk list of send WRs and post each on send list */
	for (; send_buf; send_buf = next_send_buf) {
		mad_send_wr = container_of(send_buf,
					   struct ib_mad_send_wr_private,
					   send_buf);
		mad_agent_priv = mad_send_wr->mad_agent_priv;

		ret = ib_mad_enforce_security(mad_agent_priv,
					      mad_send_wr->send_wr.pkey_index);
		if (ret)
			goto error;

		/*
		 * A send handler is mandatory; a receive handler is needed
		 * as well when a timeout was requested.
		 */
		if (!send_buf->mad_agent->send_handler ||
		    (send_buf->timeout_ms &&
		     !send_buf->mad_agent->recv_handler)) {
			ret = -EINVAL;
			goto error;
		}

		/* An agent with an RMPP version may only send RMPP classes */
		if (!ib_is_mad_class_rmpp(((struct ib_mad_hdr *) send_buf->mad)->mgmt_class)) {
			if (mad_agent_priv->agent.rmpp_version) {
				ret = -EINVAL;
				goto error;
			}
		}

		/*
		 * Save pointer to next work request to post in case the
		 * current one completes, and the user modifies the work
		 * request associated with the completion
		 */
		next_send_buf = send_buf->next;
		mad_send_wr->send_wr.ah = send_buf->ah;

		if (((struct ib_mad_hdr *) send_buf->mad)->mgmt_class ==
		    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
			ret = handle_outgoing_dr_smp(mad_agent_priv,
						     mad_send_wr);
			if (ret < 0)		/* error */
				goto error;
			else if (ret == 1)	/* locally consumed */
				continue;
		}

		mad_send_wr->tid = ((struct ib_mad_hdr *) send_buf->mad)->tid;
		/* Timeout will be updated after send completes */
		mad_send_wr->timeout = msecs_to_jiffies(send_buf->timeout_ms);
		mad_send_wr->max_retries = send_buf->retries;
		mad_send_wr->retries_left = send_buf->retries;
		/* The retry budget now lives in mad_send_wr */
		send_buf->retries = 0;
		/* Reference for work request to QP + response */
		mad_send_wr->refcount = 1 + (mad_send_wr->timeout > 0);
		mad_send_wr->status = IB_WC_SUCCESS;

		/* Reference MAD agent until send completes */
		refcount_inc(&mad_agent_priv->refcount);
		spin_lock_irqsave(&mad_agent_priv->lock, flags);
		list_add_tail(&mad_send_wr->agent_list,
			      &mad_agent_priv->send_list);
		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);

		if (ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)) {
			/*
			 * Let the RMPP layer look at the MAD first; send it
			 * here only if RMPP neither failed nor consumed it.
			 */
			ret = ib_send_rmpp_mad(mad_send_wr);
			if (ret >= 0 && ret != IB_RMPP_RESULT_CONSUMED)
				ret = ib_send_mad(mad_send_wr);
		} else
			ret = ib_send_mad(mad_send_wr);
		if (ret < 0) {
			/* Fail send request */
			spin_lock_irqsave(&mad_agent_priv->lock, flags);
			list_del(&mad_send_wr->agent_list);
			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
			/* Drop the agent reference taken above */
			deref_mad_agent(mad_agent_priv);
			goto error;
		}
	}
	return 0;
error:
	/* Tell the caller which buffer could not be posted */
	if (bad_send_buf)
		*bad_send_buf = send_buf;
	return ret;
}
EXPORT_SYMBOL(ib_post_send_mad);
1154
1155/*
1156 * ib_free_recv_mad - Returns data buffers used to receive
1157 *  a MAD to the access layer
1158 */
1159void ib_free_recv_mad(struct ib_mad_recv_wc *mad_recv_wc)
1160{
1161	struct ib_mad_recv_buf *mad_recv_buf, *temp_recv_buf;
1162	struct ib_mad_private_header *mad_priv_hdr;
1163	struct ib_mad_private *priv;
1164	struct list_head free_list;
1165
1166	INIT_LIST_HEAD(&free_list);
1167	list_splice_init(&mad_recv_wc->rmpp_list, &free_list);
1168
1169	list_for_each_entry_safe(mad_recv_buf, temp_recv_buf,
1170					&free_list, list) {
1171		mad_recv_wc = container_of(mad_recv_buf, struct ib_mad_recv_wc,
1172					   recv_buf);
1173		mad_priv_hdr = container_of(mad_recv_wc,
1174					    struct ib_mad_private_header,
1175					    recv_wc);
1176		priv = container_of(mad_priv_hdr, struct ib_mad_private,
1177				    header);
1178		kfree(priv);
1179	}
1180}
1181EXPORT_SYMBOL(ib_free_recv_mad);
1182
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1183static int method_in_use(struct ib_mad_mgmt_method_table **method,
1184			 struct ib_mad_reg_req *mad_reg_req)
1185{
1186	int i;
1187
1188	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS) {
1189		if ((*method)->agent[i]) {
1190			pr_err("Method %d already in use\n", i);
1191			return -EINVAL;
1192		}
1193	}
1194	return 0;
1195}
1196
1197static int allocate_method_table(struct ib_mad_mgmt_method_table **method)
1198{
1199	/* Allocate management method table */
1200	*method = kzalloc(sizeof **method, GFP_ATOMIC);
1201	return (*method) ? 0 : (-ENOMEM);
 
 
 
 
 
 
1202}
1203
1204/*
1205 * Check to see if there are any methods still in use
1206 */
1207static int check_method_table(struct ib_mad_mgmt_method_table *method)
1208{
1209	int i;
1210
1211	for (i = 0; i < IB_MGMT_MAX_METHODS; i++)
1212		if (method->agent[i])
1213			return 1;
1214	return 0;
1215}
1216
1217/*
1218 * Check to see if there are any method tables for this class still in use
1219 */
1220static int check_class_table(struct ib_mad_mgmt_class_table *class)
1221{
1222	int i;
1223
1224	for (i = 0; i < MAX_MGMT_CLASS; i++)
1225		if (class->method_table[i])
1226			return 1;
1227	return 0;
1228}
1229
1230static int check_vendor_class(struct ib_mad_mgmt_vendor_class *vendor_class)
1231{
1232	int i;
1233
1234	for (i = 0; i < MAX_MGMT_OUI; i++)
1235		if (vendor_class->method_table[i])
1236			return 1;
1237	return 0;
1238}
1239
1240static int find_vendor_oui(struct ib_mad_mgmt_vendor_class *vendor_class,
1241			   const char *oui)
1242{
1243	int i;
1244
1245	for (i = 0; i < MAX_MGMT_OUI; i++)
1246		/* Is there matching OUI for this vendor class ? */
1247		if (!memcmp(vendor_class->oui[i], oui, 3))
1248			return i;
1249
1250	return -1;
1251}
1252
1253static int check_vendor_table(struct ib_mad_mgmt_vendor_class_table *vendor)
1254{
1255	int i;
1256
1257	for (i = 0; i < MAX_MGMT_VENDOR_RANGE2; i++)
1258		if (vendor->vendor_class[i])
1259			return 1;
1260
1261	return 0;
1262}
1263
1264static void remove_methods_mad_agent(struct ib_mad_mgmt_method_table *method,
1265				     struct ib_mad_agent_private *agent)
1266{
1267	int i;
1268
1269	/* Remove any methods for this mad agent */
1270	for (i = 0; i < IB_MGMT_MAX_METHODS; i++)
1271		if (method->agent[i] == agent)
1272			method->agent[i] = NULL;
 
 
1273}
1274
1275static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1276			      struct ib_mad_agent_private *agent_priv,
1277			      u8 mgmt_class)
1278{
1279	struct ib_mad_port_private *port_priv;
1280	struct ib_mad_mgmt_class_table **class;
1281	struct ib_mad_mgmt_method_table **method;
1282	int i, ret;
1283
1284	port_priv = agent_priv->qp_info->port_priv;
1285	class = &port_priv->version[mad_reg_req->mgmt_class_version].class;
1286	if (!*class) {
1287		/* Allocate management class table for "new" class version */
1288		*class = kzalloc(sizeof **class, GFP_ATOMIC);
1289		if (!*class) {
 
 
1290			ret = -ENOMEM;
1291			goto error1;
1292		}
1293
1294		/* Allocate method table for this management class */
1295		method = &(*class)->method_table[mgmt_class];
1296		if ((ret = allocate_method_table(method)))
1297			goto error2;
1298	} else {
1299		method = &(*class)->method_table[mgmt_class];
1300		if (!*method) {
1301			/* Allocate method table for this management class */
1302			if ((ret = allocate_method_table(method)))
1303				goto error1;
1304		}
1305	}
1306
1307	/* Now, make sure methods are not already in use */
1308	if (method_in_use(method, mad_reg_req))
1309		goto error3;
1310
1311	/* Finally, add in methods being registered */
1312	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
1313		(*method)->agent[i] = agent_priv;
1314
1315	return 0;
1316
1317error3:
1318	/* Remove any methods for this mad agent */
1319	remove_methods_mad_agent(*method, agent_priv);
1320	/* Now, check to see if there are any methods in use */
1321	if (!check_method_table(*method)) {
1322		/* If not, release management method table */
1323		kfree(*method);
1324		*method = NULL;
1325	}
1326	ret = -EINVAL;
1327	goto error1;
1328error2:
1329	kfree(*class);
1330	*class = NULL;
1331error1:
1332	return ret;
1333}
1334
/*
 * Register the methods of @mad_reg_req for @agent_priv under a vendor class
 * that is qualified by an OUI.
 *
 * The vendor class table, the vendor class and the per-OUI method table are
 * allocated on demand.  The locals "vendor" and "vendor_class" are non-NULL
 * only when this call allocated the corresponding object, which is how the
 * error labels know what to undo.
 *
 * Returns 0 on success.  -ENOMEM (the initial value of ret) is returned for
 * allocation failures, for a matching OUI slot without a method table and
 * when all OUI slots are taken; -EINVAL is returned when a requested method
 * is already in use.
 */
static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
			   struct ib_mad_agent_private *agent_priv)
{
	struct ib_mad_port_private *port_priv;
	struct ib_mad_mgmt_vendor_class_table **vendor_table;
	struct ib_mad_mgmt_vendor_class_table *vendor = NULL;
	struct ib_mad_mgmt_vendor_class *vendor_class = NULL;
	struct ib_mad_mgmt_method_table **method;
	int i, ret = -ENOMEM;
	u8 vclass;

	/* "New" vendor (with OUI) class */
	vclass = vendor_class_index(mad_reg_req->mgmt_class);
	port_priv = agent_priv->qp_info->port_priv;
	vendor_table = &port_priv->version[
				mad_reg_req->mgmt_class_version].vendor;
	if (!*vendor_table) {
		/* Allocate mgmt vendor class table for "new" class version */
		vendor = kzalloc(sizeof *vendor, GFP_ATOMIC);
		if (!vendor)
			goto error1;

		*vendor_table = vendor;
	}
	if (!(*vendor_table)->vendor_class[vclass]) {
		/* Allocate table for this management vendor class */
		vendor_class = kzalloc(sizeof *vendor_class, GFP_ATOMIC);
		if (!vendor_class)
			goto error2;

		(*vendor_table)->vendor_class[vclass] = vendor_class;
	}
	/* First pass: reuse the slot already assigned to this OUI, if any */
	for (i = 0; i < MAX_MGMT_OUI; i++) {
		/* Is there matching OUI for this vendor class ? */
		if (!memcmp((*vendor_table)->vendor_class[vclass]->oui[i],
			    mad_reg_req->oui, 3)) {
			method = &(*vendor_table)->vendor_class[
						vclass]->method_table[i];
			/* A matching slot without a method table is an error */
			if (!*method)
				goto error3;
			goto check_in_use;
		}
	}
	/* Second pass: claim the first slot not holding a vendor OUI */
	for (i = 0; i < MAX_MGMT_OUI; i++) {
		/* OUI slot available ? */
		if (!is_vendor_oui((*vendor_table)->vendor_class[
				vclass]->oui[i])) {
			method = &(*vendor_table)->vendor_class[
				vclass]->method_table[i];
			/* Allocate method table for this OUI */
			if (!*method) {
				ret = allocate_method_table(method);
				if (ret)
					goto error3;
			}
			memcpy((*vendor_table)->vendor_class[vclass]->oui[i],
			       mad_reg_req->oui, 3);
			goto check_in_use;
		}
	}
	dev_err(&agent_priv->agent.device->dev, "All OUI slots in use\n");
	goto error3;

check_in_use:
	/* Now, make sure methods are not already in use */
	if (method_in_use(method, mad_reg_req))
		goto error4;

	/* Finally, add in methods being registered */
	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
		(*method)->agent[i] = agent_priv;

	return 0;

error4:
	/* Remove any methods for this mad agent */
	remove_methods_mad_agent(*method, agent_priv);
	/* Now, check to see if there are any methods in use */
	if (!check_method_table(*method)) {
		/* If not, release management method table */
		kfree(*method);
		*method = NULL;
	}
	ret = -EINVAL;
error3:
	/* Undo the vendor class only if this call allocated it */
	if (vendor_class) {
		(*vendor_table)->vendor_class[vclass] = NULL;
		kfree(vendor_class);
	}
error2:
	/* Undo the vendor class table only if this call allocated it */
	if (vendor) {
		*vendor_table = NULL;
		kfree(vendor);
	}
error1:
	return ret;
}
1432
/*
 * Undo the method registrations of @agent_priv.
 *
 * The agent is removed from the method table of its class and, for vendor
 * classes, from the method table selected by its OUI.  Every table that
 * becomes empty as a result is freed and its parent slot cleared, walking
 * up from method table to class / vendor class to vendor class table.
 * Nothing is done for agents that registered without a reg_req.
 */
static void remove_mad_reg_req(struct ib_mad_agent_private *agent_priv)
{
	struct ib_mad_port_private *port_priv;
	struct ib_mad_mgmt_class_table *class;
	struct ib_mad_mgmt_method_table *method;
	struct ib_mad_mgmt_vendor_class_table *vendor;
	struct ib_mad_mgmt_vendor_class *vendor_class;
	int index;
	u8 mgmt_class;

	/*
	 * Was MAD registration request supplied
	 * with original registration ?
	 */
	if (!agent_priv->reg_req)
		goto out;

	port_priv = agent_priv->qp_info->port_priv;
	mgmt_class = convert_mgmt_class(agent_priv->reg_req->mgmt_class);
	class = port_priv->version[
			agent_priv->reg_req->mgmt_class_version].class;
	if (!class)
		goto vendor_check;

	method = class->method_table[mgmt_class];
	if (method) {
		/* Remove any methods for this mad agent */
		remove_methods_mad_agent(method, agent_priv);
		/* Now, check to see if there are any methods still in use */
		if (!check_method_table(method)) {
			/* If not, release management method table */
			kfree(method);
			class->method_table[mgmt_class] = NULL;
			/* Any management classes left ? */
			if (!check_class_table(class)) {
				/* If not, release management class table */
				kfree(class);
				port_priv->version[
					agent_priv->reg_req->
					mgmt_class_version].class = NULL;
			}
		}
	}

vendor_check:
	/* The OUI-qualified tables only exist for vendor classes */
	if (!is_vendor_class(mgmt_class))
		goto out;

	/* normalize mgmt_class to vendor range 2 */
	mgmt_class = vendor_class_index(agent_priv->reg_req->mgmt_class);
	vendor = port_priv->version[
			agent_priv->reg_req->mgmt_class_version].vendor;

	if (!vendor)
		goto out;

	vendor_class = vendor->vendor_class[mgmt_class];
	if (vendor_class) {
		/* Locate the slot that carries this agent's OUI */
		index = find_vendor_oui(vendor_class, agent_priv->reg_req->oui);
		if (index < 0)
			goto out;
		method = vendor_class->method_table[index];
		if (method) {
			/* Remove any methods for this mad agent */
			remove_methods_mad_agent(method, agent_priv);
			/*
			 * Now, check to see if there are
			 * any methods still in use
			 */
			if (!check_method_table(method)) {
				/* If not, release management method table */
				kfree(method);
				vendor_class->method_table[index] = NULL;
				/* Clear the OUI so the slot can be reused */
				memset(vendor_class->oui[index], 0, 3);
				/* Any OUIs left ? */
				if (!check_vendor_class(vendor_class)) {
					/* If not, release vendor class table */
					kfree(vendor_class);
					vendor->vendor_class[mgmt_class] = NULL;
					/* Any other vendor classes left ? */
					if (!check_vendor_table(vendor)) {
						kfree(vendor);
						port_priv->version[
							agent_priv->reg_req->
							mgmt_class_version].
							vendor = NULL;
					}
				}
			}
		}
	}

out:
	return;
}
1528
/*
 * Find the MAD agent that should receive a MAD with header @mad_hdr on
 * @port_priv.
 *
 * Response MADs are looked up in ib_mad_clients by the upper 32 bits of the
 * transaction ID.  All other MADs are routed through the registration tables
 * by class version, management class and method, plus the OUI for vendor
 * classes.
 *
 * Returns the agent with one reference taken on its refcount, or NULL when
 * no agent matches or the matching agent has no receive handler (in which
 * case the reference is dropped again before returning).
 */
static struct ib_mad_agent_private *
find_mad_agent(struct ib_mad_port_private *port_priv,
	       const struct ib_mad_hdr *mad_hdr)
{
	struct ib_mad_agent_private *mad_agent = NULL;
	unsigned long flags;

	if (ib_response_mad(mad_hdr)) {
		u32 hi_tid;

		/*
		 * Routing is based on high 32 bits of transaction ID
		 * of MAD.
		 */
		hi_tid = be64_to_cpu(mad_hdr->tid) >> 32;
		rcu_read_lock();
		mad_agent = xa_load(&ib_mad_clients, hi_tid);
		/* Ignore an agent whose refcount has already reached zero */
		if (mad_agent && !refcount_inc_not_zero(&mad_agent->refcount))
			mad_agent = NULL;
		rcu_read_unlock();
	} else {
		struct ib_mad_mgmt_class_table *class;
		struct ib_mad_mgmt_method_table *method;
		struct ib_mad_mgmt_vendor_class_table *vendor;
		struct ib_mad_mgmt_vendor_class *vendor_class;
		const struct ib_vendor_mad *vendor_mad;
		int index;

		spin_lock_irqsave(&port_priv->reg_lock, flags);
		/*
		 * Routing is based on version, class, and method
		 * For "newer" vendor MADs, also based on OUI
		 */
		if (mad_hdr->class_version >= MAX_MGMT_VERSION)
			goto out;
		if (!is_vendor_class(mad_hdr->mgmt_class)) {
			class = port_priv->version[
					mad_hdr->class_version].class;
			if (!class)
				goto out;
			/* Reject classes that would index past the table */
			if (convert_mgmt_class(mad_hdr->mgmt_class) >=
			    ARRAY_SIZE(class->method_table))
				goto out;
			method = class->method_table[convert_mgmt_class(
							mad_hdr->mgmt_class)];
			if (method)
				mad_agent = method->agent[mad_hdr->method &
							  ~IB_MGMT_METHOD_RESP];
		} else {
			vendor = port_priv->version[
					mad_hdr->class_version].vendor;
			if (!vendor)
				goto out;
			vendor_class = vendor->vendor_class[vendor_class_index(
						mad_hdr->mgmt_class)];
			if (!vendor_class)
				goto out;
			/* Find matching OUI */
			vendor_mad = (const struct ib_vendor_mad *)mad_hdr;
			index = find_vendor_oui(vendor_class, vendor_mad->oui);
			if (index == -1)
				goto out;
			method = vendor_class->method_table[index];
			if (method) {
				mad_agent = method->agent[mad_hdr->method &
							  ~IB_MGMT_METHOD_RESP];
			}
		}
		/* Take the reference while reg_lock is still held */
		if (mad_agent)
			refcount_inc(&mad_agent->refcount);
out:
		spin_unlock_irqrestore(&port_priv->reg_lock, flags);
	}

	/* An agent without a receive handler cannot be given the MAD */
	if (mad_agent && !mad_agent->agent.recv_handler) {
		dev_notice(&port_priv->device->dev,
			   "No receive handler for client %p on port %u\n",
			   &mad_agent->agent, port_priv->port_num);
		deref_mad_agent(mad_agent);
		mad_agent = NULL;
	}

	return mad_agent;
}
1613
1614static int validate_mad(const struct ib_mad_hdr *mad_hdr,
1615			const struct ib_mad_qp_info *qp_info,
1616			bool opa)
1617{
1618	int valid = 0;
1619	u32 qp_num = qp_info->qp->qp_num;
1620
1621	/* Make sure MAD base version is understood */
1622	if (mad_hdr->base_version != IB_MGMT_BASE_VERSION &&
1623	    (!opa || mad_hdr->base_version != OPA_MGMT_BASE_VERSION)) {
1624		pr_err("MAD received with unsupported base version %u %s\n",
1625		       mad_hdr->base_version, opa ? "(opa)" : "");
1626		goto out;
1627	}
1628
1629	/* Filter SMI packets sent to other than QP0 */
1630	if ((mad_hdr->mgmt_class == IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
1631	    (mad_hdr->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
1632		if (qp_num == 0)
1633			valid = 1;
1634	} else {
1635		/* CM attributes other than ClassPortInfo only use Send method */
1636		if ((mad_hdr->mgmt_class == IB_MGMT_CLASS_CM) &&
1637		    (mad_hdr->attr_id != IB_MGMT_CLASSPORTINFO_ATTR_ID) &&
1638		    (mad_hdr->method != IB_MGMT_METHOD_SEND))
1639			goto out;
1640		/* Filter GSI packets sent to QP0 */
1641		if (qp_num != 0)
1642			valid = 1;
1643	}
1644
1645out:
1646	return valid;
1647}
1648
1649static int is_rmpp_data_mad(const struct ib_mad_agent_private *mad_agent_priv,
1650			    const struct ib_mad_hdr *mad_hdr)
1651{
1652	struct ib_rmpp_mad *rmpp_mad;
1653
1654	rmpp_mad = (struct ib_rmpp_mad *)mad_hdr;
1655	return !mad_agent_priv->agent.rmpp_version ||
1656		!ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent) ||
1657		!(ib_get_rmpp_flags(&rmpp_mad->rmpp_hdr) &
1658				    IB_MGMT_RMPP_FLAG_ACTIVE) ||
1659		(rmpp_mad->rmpp_hdr.rmpp_type == IB_MGMT_RMPP_TYPE_DATA);
1660}
1661
1662static inline int rcv_has_same_class(const struct ib_mad_send_wr_private *wr,
1663				     const struct ib_mad_recv_wc *rwc)
1664{
1665	return ((struct ib_mad_hdr *)(wr->send_buf.mad))->mgmt_class ==
1666		rwc->recv_buf.mad->mad_hdr.mgmt_class;
1667}
1668
/*
 * Check whether the addressing of a received MAD is consistent with that of
 * a previously sent MAD, i.e. whether one can be the answer to the other.
 * @mad_agent_priv: agent that owns the send; supplies device and port
 * @wr: the send work request
 * @rwc: the receive work completion
 *
 * Returns non-zero when the addresses match and 0 when they differ or when
 * any of the lookups needed for the comparison fails.
 */
static inline int
rcv_has_same_gid(const struct ib_mad_agent_private *mad_agent_priv,
		 const struct ib_mad_send_wr_private *wr,
		 const struct ib_mad_recv_wc *rwc)
{
	struct rdma_ah_attr attr;
	u8 send_resp, rcv_resp;
	union ib_gid sgid;
	struct ib_device *device = mad_agent_priv->agent.device;
	u32 port_num = mad_agent_priv->agent.port_num;
	u8 lmc;
	bool has_grh;

	send_resp = ib_response_mad((struct ib_mad_hdr *)wr->send_buf.mad);
	rcv_resp = ib_response_mad(&rwc->recv_buf.mad->mad_hdr);

	if (send_resp == rcv_resp)
		/* both requests, or both responses. GIDs different */
		return 0;

	if (rdma_query_ah(wr->send_buf.ah, &attr))
		/* Assume not equal, to avoid false positives. */
		return 0;

	has_grh = !!(rdma_ah_get_ah_flags(&attr) & IB_AH_GRH);
	if (has_grh != !!(rwc->wc->wc_flags & IB_WC_GRH))
		/* one has GID, other does not.  Assume different */
		return 0;

	if (!send_resp && rcv_resp) {
		/* is request/response. */
		if (!has_grh) {
			if (ib_get_cached_lmc(device, port_num, &lmc))
				return 0;
			/*
			 * Without a GRH compare the path bits, restricted to
			 * the low lmc bits; lmc == 0 always matches.
			 */
			return (!lmc || !((rdma_ah_get_path_bits(&attr) ^
					   rwc->wc->dlid_path_bits) &
					  ((1 << lmc) - 1)));
		} else {
			const struct ib_global_route *grh =
					rdma_ah_read_grh(&attr);

			/* Our source GID must be the GID the reply targets */
			if (rdma_query_gid(device, port_num,
					   grh->sgid_index, &sgid))
				return 0;
			return !memcmp(sgid.raw, rwc->recv_buf.grh->dgid.raw,
				       16);
		}
	}

	/*
	 * Remaining case: we sent a response and received a request.  Compare
	 * the send's destination with the source of the received MAD.
	 */
	if (!has_grh)
		return rdma_ah_get_dlid(&attr) == rwc->wc->slid;
	else
		return !memcmp(rdma_ah_read_grh(&attr)->dgid.raw,
			       rwc->recv_buf.grh->sgid.raw,
			       16);
}
1725
1726static inline int is_direct(u8 class)
1727{
1728	return (class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE);
1729}
1730
1731struct ib_mad_send_wr_private*
1732ib_find_send_mad(const struct ib_mad_agent_private *mad_agent_priv,
1733		 const struct ib_mad_recv_wc *wc)
1734{
1735	struct ib_mad_send_wr_private *wr;
1736	const struct ib_mad_hdr *mad_hdr;
1737
1738	mad_hdr = &wc->recv_buf.mad->mad_hdr;
1739
1740	list_for_each_entry(wr, &mad_agent_priv->wait_list, agent_list) {
1741		if ((wr->tid == mad_hdr->tid) &&
1742		    rcv_has_same_class(wr, wc) &&
1743		    /*
1744		     * Don't check GID for direct routed MADs.
1745		     * These might have permissive LIDs.
1746		     */
1747		    (is_direct(mad_hdr->mgmt_class) ||
1748		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1749			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1750	}
1751
1752	/*
1753	 * It's possible to receive the response before we've
1754	 * been notified that the send has completed
1755	 */
1756	list_for_each_entry(wr, &mad_agent_priv->send_list, agent_list) {
1757		if (is_rmpp_data_mad(mad_agent_priv, wr->send_buf.mad) &&
1758		    wr->tid == mad_hdr->tid &&
1759		    wr->timeout &&
1760		    rcv_has_same_class(wr, wc) &&
1761		    /*
1762		     * Don't check GID for direct routed MADs.
1763		     * These might have permissive LIDs.
1764		     */
1765		    (is_direct(mad_hdr->mgmt_class) ||
1766		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1767			/* Verify request has not been canceled */
1768			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1769	}
1770	return NULL;
1771}
1772
1773void ib_mark_mad_done(struct ib_mad_send_wr_private *mad_send_wr)
1774{
1775	mad_send_wr->timeout = 0;
1776	if (mad_send_wr->refcount == 1)
1777		list_move_tail(&mad_send_wr->agent_list,
1778			      &mad_send_wr->mad_agent_priv->done_list);
1779}
1780
/*
 * Deliver a received MAD to the agent it was routed to.
 * @mad_agent_priv: receiving agent
 * @mad_recv_wc: receive work completion for the MAD
 *
 * Every path through this function ends with a deref_mad_agent() call on
 * @mad_agent_priv, so the caller is expected to hold a reference on entry.
 * The MAD is either passed to the agent's recv_handler or freed here.
 */
static void ib_mad_complete_recv(struct ib_mad_agent_private *mad_agent_priv,
				 struct ib_mad_recv_wc *mad_recv_wc)
{
	struct ib_mad_send_wr_private *mad_send_wr;
	struct ib_mad_send_wc mad_send_wc;
	unsigned long flags;
	int ret;

	INIT_LIST_HEAD(&mad_recv_wc->rmpp_list);
	ret = ib_mad_enforce_security(mad_agent_priv,
				      mad_recv_wc->wc->pkey_index);
	if (ret) {
		/* Security check failed: drop the MAD */
		ib_free_recv_mad(mad_recv_wc);
		deref_mad_agent(mad_agent_priv);
		return;
	}

	list_add(&mad_recv_wc->recv_buf.list, &mad_recv_wc->rmpp_list);
	if (ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)) {
		/* RMPP processing may hold the MAD back and return NULL */
		mad_recv_wc = ib_process_rmpp_recv_wc(mad_agent_priv,
						      mad_recv_wc);
		if (!mad_recv_wc) {
			deref_mad_agent(mad_agent_priv);
			return;
		}
	}

	/* Complete corresponding request */
	if (ib_response_mad(&mad_recv_wc->recv_buf.mad->mad_hdr)) {
		spin_lock_irqsave(&mad_agent_priv->lock, flags);
		mad_send_wr = ib_find_send_mad(mad_agent_priv, mad_recv_wc);
		if (!mad_send_wr) {
			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
			if (!ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)
			   && ib_is_mad_class_rmpp(mad_recv_wc->recv_buf.mad->mad_hdr.mgmt_class)
			   && (ib_get_rmpp_flags(&((struct ib_rmpp_mad *)mad_recv_wc->recv_buf.mad)->rmpp_hdr)
					& IB_MGMT_RMPP_FLAG_ACTIVE)) {
				/* user rmpp is in effect
				 * and this is an active RMPP MAD
				 */
				mad_agent_priv->agent.recv_handler(
						&mad_agent_priv->agent, NULL,
						mad_recv_wc);
				deref_mad_agent(mad_agent_priv);
			} else {
				/* not user rmpp, revert to normal behavior and
				 * drop the mad
				 */
				ib_free_recv_mad(mad_recv_wc);
				deref_mad_agent(mad_agent_priv);
				return;
			}
		} else {
			/* Mark the request done while the agent lock is held */
			ib_mark_mad_done(mad_send_wr);
			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);

			/* Defined behavior is to complete response before request */
			mad_agent_priv->agent.recv_handler(
					&mad_agent_priv->agent,
					&mad_send_wr->send_buf,
					mad_recv_wc);
			deref_mad_agent(mad_agent_priv);

			/* Now report successful completion of the request */
			mad_send_wc.status = IB_WC_SUCCESS;
			mad_send_wc.vendor_err = 0;
			mad_send_wc.send_buf = &mad_send_wr->send_buf;
			ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
		}
	} else {
		/* Not a response: hand it over with no associated send */
		mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent, NULL,
						   mad_recv_wc);
		deref_mad_agent(mad_agent_priv);
	}
}
1855
/*
 * Process a received IB SMP and decide what to do with it.
 * @port_priv: port the SMP arrived on
 * @qp_info: QP the SMP arrived on
 * @wc: work completion of the receive
 * @port_num: port number passed to the SMI helpers
 * @recv: the received MAD
 * @response: scratch MAD used to build a forwarded copy on switches
 *
 * Returns IB_SMI_HANDLE when the SMP should be processed further by the
 * caller and IB_SMI_DISCARD when it must not be, either because one of the
 * SMI checks rejected it or because it was forwarded here.
 */
static enum smi_action handle_ib_smi(const struct ib_mad_port_private *port_priv,
				     const struct ib_mad_qp_info *qp_info,
				     const struct ib_wc *wc,
				     u32 port_num,
				     struct ib_mad_private *recv,
				     struct ib_mad_private *response)
{
	enum smi_forward_action retsmi;
	struct ib_smp *smp = (struct ib_smp *)recv->mad;

	trace_ib_mad_handle_ib_smi(smp);

	if (smi_handle_dr_smp_recv(smp,
				   rdma_cap_ib_switch(port_priv->device),
				   port_num,
				   port_priv->device->phys_port_cnt) ==
				   IB_SMI_DISCARD)
		return IB_SMI_DISCARD;

	retsmi = smi_check_forward_dr_smp(smp);
	if (retsmi == IB_SMI_LOCAL)
		return IB_SMI_HANDLE;

	if (retsmi == IB_SMI_SEND) { /* don't forward */
		if (smi_handle_dr_smp_send(smp,
					   rdma_cap_ib_switch(port_priv->device),
					   port_num) == IB_SMI_DISCARD)
			return IB_SMI_DISCARD;

		if (smi_check_local_smp(smp, port_priv->device) == IB_SMI_DISCARD)
			return IB_SMI_DISCARD;
	} else if (rdma_cap_ib_switch(port_priv->device)) {
		/* forward case for switches */
		memcpy(response, recv, mad_priv_size(response));
		/* Re-point the copied internal pointers at the copy itself */
		response->header.recv_wc.wc = &response->header.wc;
		response->header.recv_wc.recv_buf.mad = (struct ib_mad *)response->mad;
		response->header.recv_wc.recv_buf.grh = &response->grh;

		agent_send_response((const struct ib_mad_hdr *)response->mad,
				    &response->grh, wc,
				    port_priv->device,
				    smi_get_fwd_port(smp),
				    qp_info->qp->qp_num,
				    response->mad_size,
				    false);

		return IB_SMI_DISCARD;
	}
	return IB_SMI_HANDLE;
}
1906
1907static bool generate_unmatched_resp(const struct ib_mad_private *recv,
1908				    struct ib_mad_private *response,
1909				    size_t *resp_len, bool opa)
1910{
1911	const struct ib_mad_hdr *recv_hdr = (const struct ib_mad_hdr *)recv->mad;
1912	struct ib_mad_hdr *resp_hdr = (struct ib_mad_hdr *)response->mad;
1913
1914	if (recv_hdr->method == IB_MGMT_METHOD_GET ||
1915	    recv_hdr->method == IB_MGMT_METHOD_SET) {
1916		memcpy(response, recv, mad_priv_size(response));
1917		response->header.recv_wc.wc = &response->header.wc;
1918		response->header.recv_wc.recv_buf.mad = (struct ib_mad *)response->mad;
1919		response->header.recv_wc.recv_buf.grh = &response->grh;
1920		resp_hdr->method = IB_MGMT_METHOD_GET_RESP;
1921		resp_hdr->status = cpu_to_be16(IB_MGMT_MAD_STATUS_UNSUPPORTED_METHOD_ATTRIB);
1922		if (recv_hdr->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
1923			resp_hdr->status |= IB_SMP_DIRECTION;
1924
1925		if (opa && recv_hdr->base_version == OPA_MGMT_BASE_VERSION) {
1926			if (recv_hdr->mgmt_class ==
1927			    IB_MGMT_CLASS_SUBN_LID_ROUTED ||
1928			    recv_hdr->mgmt_class ==
1929			    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
1930				*resp_len = opa_get_smp_header_size(
1931							(struct opa_smp *)recv->mad);
1932			else
1933				*resp_len = sizeof(struct ib_mad_hdr);
1934		}
1935
1936		return true;
1937	} else {
1938		return false;
1939	}
1940}
1941
1942static enum smi_action
1943handle_opa_smi(struct ib_mad_port_private *port_priv,
1944	       struct ib_mad_qp_info *qp_info,
1945	       struct ib_wc *wc,
1946	       u32 port_num,
1947	       struct ib_mad_private *recv,
1948	       struct ib_mad_private *response)
1949{
1950	enum smi_forward_action retsmi;
1951	struct opa_smp *smp = (struct opa_smp *)recv->mad;
1952
1953	trace_ib_mad_handle_opa_smi(smp);
1954
1955	if (opa_smi_handle_dr_smp_recv(smp,
1956				   rdma_cap_ib_switch(port_priv->device),
1957				   port_num,
1958				   port_priv->device->phys_port_cnt) ==
1959				   IB_SMI_DISCARD)
1960		return IB_SMI_DISCARD;
1961
1962	retsmi = opa_smi_check_forward_dr_smp(smp);
1963	if (retsmi == IB_SMI_LOCAL)
1964		return IB_SMI_HANDLE;
1965
1966	if (retsmi == IB_SMI_SEND) { /* don't forward */
1967		if (opa_smi_handle_dr_smp_send(smp,
1968					   rdma_cap_ib_switch(port_priv->device),
1969					   port_num) == IB_SMI_DISCARD)
1970			return IB_SMI_DISCARD;
1971
1972		if (opa_smi_check_local_smp(smp, port_priv->device) ==
1973		    IB_SMI_DISCARD)
1974			return IB_SMI_DISCARD;
1975
1976	} else if (rdma_cap_ib_switch(port_priv->device)) {
1977		/* forward case for switches */
1978		memcpy(response, recv, mad_priv_size(response));
1979		response->header.recv_wc.wc = &response->header.wc;
1980		response->header.recv_wc.recv_buf.opa_mad =
1981				(struct opa_mad *)response->mad;
1982		response->header.recv_wc.recv_buf.grh = &response->grh;
1983
1984		agent_send_response((const struct ib_mad_hdr *)response->mad,
1985				    &response->grh, wc,
1986				    port_priv->device,
1987				    opa_smi_get_fwd_port(smp),
1988				    qp_info->qp->qp_num,
1989				    recv->header.wc.byte_len,
1990				    true);
1991
1992		return IB_SMI_DISCARD;
1993	}
1994
1995	return IB_SMI_HANDLE;
1996}
1997
1998static enum smi_action
1999handle_smi(struct ib_mad_port_private *port_priv,
2000	   struct ib_mad_qp_info *qp_info,
2001	   struct ib_wc *wc,
2002	   u32 port_num,
2003	   struct ib_mad_private *recv,
2004	   struct ib_mad_private *response,
2005	   bool opa)
2006{
2007	struct ib_mad_hdr *mad_hdr = (struct ib_mad_hdr *)recv->mad;
2008
2009	if (opa && mad_hdr->base_version == OPA_MGMT_BASE_VERSION &&
2010	    mad_hdr->class_version == OPA_SM_CLASS_VERSION)
2011		return handle_opa_smi(port_priv, qp_info, wc, port_num, recv,
2012				      response);
2013
2014	return handle_ib_smi(port_priv, qp_info, wc, port_num, recv, response);
2015}
2016
2017static void ib_mad_recv_done(struct ib_cq *cq, struct ib_wc *wc)
2018{
2019	struct ib_mad_port_private *port_priv = cq->cq_context;
2020	struct ib_mad_list_head *mad_list =
2021		container_of(wc->wr_cqe, struct ib_mad_list_head, cqe);
2022	struct ib_mad_qp_info *qp_info;
2023	struct ib_mad_private_header *mad_priv_hdr;
2024	struct ib_mad_private *recv, *response = NULL;
 
2025	struct ib_mad_agent_private *mad_agent;
2026	u32 port_num;
2027	int ret = IB_MAD_RESULT_SUCCESS;
2028	size_t mad_size;
2029	u16 resp_mad_pkey_index = 0;
2030	bool opa;
2031
2032	if (list_empty_careful(&port_priv->port_list))
2033		return;
2034
2035	if (wc->status != IB_WC_SUCCESS) {
2036		/*
2037		 * Receive errors indicate that the QP has entered the error
2038		 * state - error handling/shutdown code will cleanup
2039		 */
2040		return;
2041	}
2042
 
2043	qp_info = mad_list->mad_queue->qp_info;
2044	dequeue_mad(mad_list);
2045
2046	opa = rdma_cap_opa_mad(qp_info->port_priv->device,
2047			       qp_info->port_priv->port_num);
2048
2049	mad_priv_hdr = container_of(mad_list, struct ib_mad_private_header,
2050				    mad_list);
2051	recv = container_of(mad_priv_hdr, struct ib_mad_private, header);
2052	ib_dma_unmap_single(port_priv->device,
2053			    recv->header.mapping,
2054			    mad_priv_dma_size(recv),
 
2055			    DMA_FROM_DEVICE);
2056
2057	/* Setup MAD receive work completion from "normal" work completion */
2058	recv->header.wc = *wc;
2059	recv->header.recv_wc.wc = &recv->header.wc;
2060
2061	if (opa && ((struct ib_mad_hdr *)(recv->mad))->base_version == OPA_MGMT_BASE_VERSION) {
2062		recv->header.recv_wc.mad_len = wc->byte_len - sizeof(struct ib_grh);
2063		recv->header.recv_wc.mad_seg_size = sizeof(struct opa_mad);
2064	} else {
2065		recv->header.recv_wc.mad_len = sizeof(struct ib_mad);
2066		recv->header.recv_wc.mad_seg_size = sizeof(struct ib_mad);
2067	}
2068
2069	recv->header.recv_wc.recv_buf.mad = (struct ib_mad *)recv->mad;
2070	recv->header.recv_wc.recv_buf.grh = &recv->grh;
2071
 
 
 
2072	/* Validate MAD */
2073	if (!validate_mad((const struct ib_mad_hdr *)recv->mad, qp_info, opa))
2074		goto out;
2075
2076	trace_ib_mad_recv_done_handler(qp_info, wc,
2077				       (struct ib_mad_hdr *)recv->mad);
2078
2079	mad_size = recv->mad_size;
2080	response = alloc_mad_private(mad_size, GFP_KERNEL);
2081	if (!response)
2082		goto out;
 
2083
2084	if (rdma_cap_ib_switch(port_priv->device))
2085		port_num = wc->port_num;
2086	else
2087		port_num = port_priv->port_num;
2088
2089	if (((struct ib_mad_hdr *)recv->mad)->mgmt_class ==
2090	    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
2091		if (handle_smi(port_priv, qp_info, wc, port_num, recv,
2092			       response, opa)
2093		    == IB_SMI_DISCARD)
 
 
 
 
2094			goto out;
2095	}
2096
2097	/* Give driver "right of first refusal" on incoming MAD */
2098	if (port_priv->device->ops.process_mad) {
2099		ret = port_priv->device->ops.process_mad(
2100			port_priv->device, 0, port_priv->port_num, wc,
2101			&recv->grh, (const struct ib_mad *)recv->mad,
2102			(struct ib_mad *)response->mad, &mad_size,
2103			&resp_mad_pkey_index);
 
 
2104
2105		if (opa)
2106			wc->pkey_index = resp_mad_pkey_index;
 
 
 
 
 
 
 
 
 
 
 
 
2107
 
 
 
 
 
 
 
 
 
 
 
 
2108		if (ret & IB_MAD_RESULT_SUCCESS) {
2109			if (ret & IB_MAD_RESULT_CONSUMED)
2110				goto out;
2111			if (ret & IB_MAD_RESULT_REPLY) {
2112				agent_send_response((const struct ib_mad_hdr *)response->mad,
2113						    &recv->grh, wc,
2114						    port_priv->device,
2115						    port_num,
2116						    qp_info->qp->qp_num,
2117						    mad_size, opa);
2118				goto out;
2119			}
2120		}
2121	}
2122
2123	mad_agent = find_mad_agent(port_priv, (const struct ib_mad_hdr *)recv->mad);
2124	if (mad_agent) {
2125		trace_ib_mad_recv_done_agent(mad_agent);
2126		ib_mad_complete_recv(mad_agent, &recv->header.recv_wc);
2127		/*
2128		 * recv is freed up in error cases in ib_mad_complete_recv
2129		 * or via recv_handler in ib_mad_complete_recv()
2130		 */
2131		recv = NULL;
2132	} else if ((ret & IB_MAD_RESULT_SUCCESS) &&
2133		   generate_unmatched_resp(recv, response, &mad_size, opa)) {
2134		agent_send_response((const struct ib_mad_hdr *)response->mad, &recv->grh, wc,
2135				    port_priv->device, port_num,
2136				    qp_info->qp->qp_num, mad_size, opa);
2137	}
2138
2139out:
2140	/* Post another receive request for this QP */
2141	if (response) {
2142		ib_mad_post_receive_mads(qp_info, response);
2143		kfree(recv);
 
2144	} else
2145		ib_mad_post_receive_mads(qp_info, recv);
2146}
2147
2148static void adjust_timeout(struct ib_mad_agent_private *mad_agent_priv)
2149{
2150	struct ib_mad_send_wr_private *mad_send_wr;
2151	unsigned long delay;
2152
2153	if (list_empty(&mad_agent_priv->wait_list)) {
2154		cancel_delayed_work(&mad_agent_priv->timed_work);
2155	} else {
2156		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2157					 struct ib_mad_send_wr_private,
2158					 agent_list);
2159
2160		if (time_after(mad_agent_priv->timeout,
2161			       mad_send_wr->timeout)) {
2162			mad_agent_priv->timeout = mad_send_wr->timeout;
 
2163			delay = mad_send_wr->timeout - jiffies;
2164			if ((long)delay <= 0)
2165				delay = 1;
2166			mod_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
2167					 &mad_agent_priv->timed_work, delay);
 
2168		}
2169	}
2170}
2171
2172static void wait_for_response(struct ib_mad_send_wr_private *mad_send_wr)
2173{
2174	struct ib_mad_agent_private *mad_agent_priv;
2175	struct ib_mad_send_wr_private *temp_mad_send_wr;
2176	struct list_head *list_item;
2177	unsigned long delay;
2178
2179	mad_agent_priv = mad_send_wr->mad_agent_priv;
2180	list_del(&mad_send_wr->agent_list);
2181
2182	delay = mad_send_wr->timeout;
2183	mad_send_wr->timeout += jiffies;
2184
2185	if (delay) {
2186		list_for_each_prev(list_item, &mad_agent_priv->wait_list) {
2187			temp_mad_send_wr = list_entry(list_item,
2188						struct ib_mad_send_wr_private,
2189						agent_list);
2190			if (time_after(mad_send_wr->timeout,
2191				       temp_mad_send_wr->timeout))
2192				break;
2193		}
2194	} else {
2195		list_item = &mad_agent_priv->wait_list;
2196	}
2197
 
2198	list_add(&mad_send_wr->agent_list, list_item);
2199
2200	/* Reschedule a work item if we have a shorter timeout */
2201	if (mad_agent_priv->wait_list.next == &mad_send_wr->agent_list)
2202		mod_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
2203				 &mad_agent_priv->timed_work, delay);
 
 
2204}
2205
2206void ib_reset_mad_timeout(struct ib_mad_send_wr_private *mad_send_wr,
2207			  unsigned long timeout_ms)
2208{
2209	mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2210	wait_for_response(mad_send_wr);
2211}
2212
2213/*
2214 * Process a send work completion
2215 */
2216void ib_mad_complete_send_wr(struct ib_mad_send_wr_private *mad_send_wr,
2217			     struct ib_mad_send_wc *mad_send_wc)
2218{
2219	struct ib_mad_agent_private	*mad_agent_priv;
2220	unsigned long			flags;
2221	int				ret;
2222
2223	mad_agent_priv = mad_send_wr->mad_agent_priv;
2224	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2225	if (ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)) {
2226		ret = ib_process_rmpp_send_wc(mad_send_wr, mad_send_wc);
2227		if (ret == IB_RMPP_RESULT_CONSUMED)
2228			goto done;
2229	} else
2230		ret = IB_RMPP_RESULT_UNHANDLED;
2231
2232	if (mad_send_wc->status != IB_WC_SUCCESS &&
2233	    mad_send_wr->status == IB_WC_SUCCESS) {
2234		mad_send_wr->status = mad_send_wc->status;
2235		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2236	}
2237
2238	if (--mad_send_wr->refcount > 0) {
2239		if (mad_send_wr->refcount == 1 && mad_send_wr->timeout &&
2240		    mad_send_wr->status == IB_WC_SUCCESS) {
2241			wait_for_response(mad_send_wr);
2242		}
2243		goto done;
2244	}
2245
2246	/* Remove send from MAD agent and notify client of completion */
2247	list_del(&mad_send_wr->agent_list);
2248	adjust_timeout(mad_agent_priv);
2249	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2250
2251	if (mad_send_wr->status != IB_WC_SUCCESS)
2252		mad_send_wc->status = mad_send_wr->status;
2253	if (ret == IB_RMPP_RESULT_INTERNAL)
2254		ib_rmpp_send_handler(mad_send_wc);
2255	else
2256		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2257						   mad_send_wc);
2258
2259	/* Release reference on agent taken when sending */
2260	deref_mad_agent(mad_agent_priv);
2261	return;
2262done:
2263	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2264}
2265
2266static void ib_mad_send_done(struct ib_cq *cq, struct ib_wc *wc)
 
2267{
2268	struct ib_mad_port_private *port_priv = cq->cq_context;
2269	struct ib_mad_list_head *mad_list =
2270		container_of(wc->wr_cqe, struct ib_mad_list_head, cqe);
2271	struct ib_mad_send_wr_private	*mad_send_wr, *queued_send_wr;
 
2272	struct ib_mad_qp_info		*qp_info;
2273	struct ib_mad_queue		*send_queue;
 
2274	struct ib_mad_send_wc		mad_send_wc;
2275	unsigned long flags;
2276	int ret;
2277
2278	if (list_empty_careful(&port_priv->port_list))
2279		return;
2280
2281	if (wc->status != IB_WC_SUCCESS) {
2282		if (!ib_mad_send_error(port_priv, wc))
2283			return;
2284	}
2285
2286	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2287				   mad_list);
2288	send_queue = mad_list->mad_queue;
2289	qp_info = send_queue->qp_info;
2290
2291	trace_ib_mad_send_done_agent(mad_send_wr->mad_agent_priv);
2292	trace_ib_mad_send_done_handler(mad_send_wr, wc);
2293
2294retry:
2295	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2296			    mad_send_wr->header_mapping,
2297			    mad_send_wr->sg_list[0].length, DMA_TO_DEVICE);
2298	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2299			    mad_send_wr->payload_mapping,
2300			    mad_send_wr->sg_list[1].length, DMA_TO_DEVICE);
2301	queued_send_wr = NULL;
2302	spin_lock_irqsave(&send_queue->lock, flags);
2303	list_del(&mad_list->list);
2304
2305	/* Move queued send to the send queue */
2306	if (send_queue->count-- > send_queue->max_active) {
2307		mad_list = container_of(qp_info->overflow_list.next,
2308					struct ib_mad_list_head, list);
2309		queued_send_wr = container_of(mad_list,
2310					struct ib_mad_send_wr_private,
2311					mad_list);
2312		list_move_tail(&mad_list->list, &send_queue->list);
2313	}
2314	spin_unlock_irqrestore(&send_queue->lock, flags);
2315
2316	mad_send_wc.send_buf = &mad_send_wr->send_buf;
2317	mad_send_wc.status = wc->status;
2318	mad_send_wc.vendor_err = wc->vendor_err;
 
 
 
2319	ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
2320
2321	if (queued_send_wr) {
2322		trace_ib_mad_send_done_resend(queued_send_wr, qp_info);
2323		ret = ib_post_send(qp_info->qp, &queued_send_wr->send_wr.wr,
2324				   NULL);
2325		if (ret) {
2326			dev_err(&port_priv->device->dev,
2327				"ib_post_send failed: %d\n", ret);
2328			mad_send_wr = queued_send_wr;
2329			wc->status = IB_WC_LOC_QP_OP_ERR;
2330			goto retry;
2331		}
2332	}
2333}
2334
2335static void mark_sends_for_retry(struct ib_mad_qp_info *qp_info)
2336{
2337	struct ib_mad_send_wr_private *mad_send_wr;
2338	struct ib_mad_list_head *mad_list;
2339	unsigned long flags;
2340
2341	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
2342	list_for_each_entry(mad_list, &qp_info->send_queue.list, list) {
2343		mad_send_wr = container_of(mad_list,
2344					   struct ib_mad_send_wr_private,
2345					   mad_list);
2346		mad_send_wr->retry = 1;
2347	}
2348	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
2349}
2350
2351static bool ib_mad_send_error(struct ib_mad_port_private *port_priv,
2352		struct ib_wc *wc)
2353{
2354	struct ib_mad_list_head *mad_list =
2355		container_of(wc->wr_cqe, struct ib_mad_list_head, cqe);
2356	struct ib_mad_qp_info *qp_info = mad_list->mad_queue->qp_info;
2357	struct ib_mad_send_wr_private *mad_send_wr;
2358	int ret;
2359
 
 
 
 
 
 
 
 
 
 
2360	/*
2361	 * Send errors will transition the QP to SQE - move
2362	 * QP to RTS and repost flushed work requests
2363	 */
2364	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2365				   mad_list);
2366	if (wc->status == IB_WC_WR_FLUSH_ERR) {
2367		if (mad_send_wr->retry) {
2368			/* Repost send */
 
 
2369			mad_send_wr->retry = 0;
2370			trace_ib_mad_error_handler(mad_send_wr, qp_info);
2371			ret = ib_post_send(qp_info->qp, &mad_send_wr->send_wr.wr,
2372					   NULL);
2373			if (!ret)
2374				return false;
2375		}
2376	} else {
2377		struct ib_qp_attr *attr;
2378
2379		/* Transition QP to RTS and fail offending send */
2380		attr = kmalloc(sizeof *attr, GFP_KERNEL);
2381		if (attr) {
2382			attr->qp_state = IB_QPS_RTS;
2383			attr->cur_qp_state = IB_QPS_SQE;
2384			ret = ib_modify_qp(qp_info->qp, attr,
2385					   IB_QP_STATE | IB_QP_CUR_STATE);
2386			kfree(attr);
2387			if (ret)
2388				dev_err(&port_priv->device->dev,
2389					"%s - ib_modify_qp to RTS: %d\n",
2390					__func__, ret);
2391			else
2392				mark_sends_for_retry(qp_info);
2393		}
 
2394	}
 
2395
2396	return true;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2397}
2398
2399static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv)
2400{
2401	unsigned long flags;
2402	struct ib_mad_send_wr_private *mad_send_wr, *temp_mad_send_wr;
2403	struct ib_mad_send_wc mad_send_wc;
2404	struct list_head cancel_list;
2405
2406	INIT_LIST_HEAD(&cancel_list);
2407
2408	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2409	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2410				 &mad_agent_priv->send_list, agent_list) {
2411		if (mad_send_wr->status == IB_WC_SUCCESS) {
2412			mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2413			mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2414		}
2415	}
2416
2417	/* Empty wait list to prevent receives from finding a request */
2418	list_splice_init(&mad_agent_priv->wait_list, &cancel_list);
2419	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2420
2421	/* Report all cancelled requests */
2422	mad_send_wc.status = IB_WC_WR_FLUSH_ERR;
2423	mad_send_wc.vendor_err = 0;
2424
2425	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2426				 &cancel_list, agent_list) {
2427		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2428		list_del(&mad_send_wr->agent_list);
2429		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2430						   &mad_send_wc);
2431		deref_mad_agent(mad_agent_priv);
2432	}
2433}
2434
2435static struct ib_mad_send_wr_private*
2436find_send_wr(struct ib_mad_agent_private *mad_agent_priv,
2437	     struct ib_mad_send_buf *send_buf)
2438{
2439	struct ib_mad_send_wr_private *mad_send_wr;
2440
2441	list_for_each_entry(mad_send_wr, &mad_agent_priv->wait_list,
2442			    agent_list) {
2443		if (&mad_send_wr->send_buf == send_buf)
2444			return mad_send_wr;
2445	}
2446
2447	list_for_each_entry(mad_send_wr, &mad_agent_priv->send_list,
2448			    agent_list) {
2449		if (is_rmpp_data_mad(mad_agent_priv,
2450				     mad_send_wr->send_buf.mad) &&
2451		    &mad_send_wr->send_buf == send_buf)
2452			return mad_send_wr;
2453	}
2454	return NULL;
2455}
2456
2457int ib_modify_mad(struct ib_mad_send_buf *send_buf, u32 timeout_ms)
 
2458{
2459	struct ib_mad_agent_private *mad_agent_priv;
2460	struct ib_mad_send_wr_private *mad_send_wr;
2461	unsigned long flags;
2462	int active;
2463
2464	if (!send_buf)
2465		return -EINVAL;
2466
2467	mad_agent_priv = container_of(send_buf->mad_agent,
2468				      struct ib_mad_agent_private, agent);
2469	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2470	mad_send_wr = find_send_wr(mad_agent_priv, send_buf);
2471	if (!mad_send_wr || mad_send_wr->status != IB_WC_SUCCESS) {
2472		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2473		return -EINVAL;
2474	}
2475
2476	active = (!mad_send_wr->timeout || mad_send_wr->refcount > 1);
2477	if (!timeout_ms) {
2478		mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2479		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2480	}
2481
2482	mad_send_wr->send_buf.timeout_ms = timeout_ms;
2483	if (active)
2484		mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2485	else
2486		ib_reset_mad_timeout(mad_send_wr, timeout_ms);
2487
2488	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2489	return 0;
2490}
2491EXPORT_SYMBOL(ib_modify_mad);
2492
 
 
 
 
 
 
 
2493static void local_completions(struct work_struct *work)
2494{
2495	struct ib_mad_agent_private *mad_agent_priv;
2496	struct ib_mad_local_private *local;
2497	struct ib_mad_agent_private *recv_mad_agent;
2498	unsigned long flags;
2499	int free_mad;
2500	struct ib_wc wc;
2501	struct ib_mad_send_wc mad_send_wc;
2502	bool opa;
2503
2504	mad_agent_priv =
2505		container_of(work, struct ib_mad_agent_private, local_work);
2506
2507	opa = rdma_cap_opa_mad(mad_agent_priv->qp_info->port_priv->device,
2508			       mad_agent_priv->qp_info->port_priv->port_num);
2509
2510	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2511	while (!list_empty(&mad_agent_priv->local_list)) {
2512		local = list_entry(mad_agent_priv->local_list.next,
2513				   struct ib_mad_local_private,
2514				   completion_list);
2515		list_del(&local->completion_list);
2516		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2517		free_mad = 0;
2518		if (local->mad_priv) {
2519			u8 base_version;
2520			recv_mad_agent = local->recv_mad_agent;
2521			if (!recv_mad_agent) {
2522				dev_err(&mad_agent_priv->agent.device->dev,
2523					"No receive MAD agent for local completion\n");
2524				free_mad = 1;
2525				goto local_send_completion;
2526			}
2527
2528			/*
2529			 * Defined behavior is to complete response
2530			 * before request
2531			 */
2532			build_smp_wc(recv_mad_agent->agent.qp,
2533				     local->mad_send_wr->send_wr.wr.wr_cqe,
2534				     be16_to_cpu(IB_LID_PERMISSIVE),
2535				     local->mad_send_wr->send_wr.pkey_index,
2536				     recv_mad_agent->agent.port_num, &wc);
2537
2538			local->mad_priv->header.recv_wc.wc = &wc;
2539
2540			base_version = ((struct ib_mad_hdr *)(local->mad_priv->mad))->base_version;
2541			if (opa && base_version == OPA_MGMT_BASE_VERSION) {
2542				local->mad_priv->header.recv_wc.mad_len = local->return_wc_byte_len;
2543				local->mad_priv->header.recv_wc.mad_seg_size = sizeof(struct opa_mad);
2544			} else {
2545				local->mad_priv->header.recv_wc.mad_len = sizeof(struct ib_mad);
2546				local->mad_priv->header.recv_wc.mad_seg_size = sizeof(struct ib_mad);
2547			}
2548
2549			INIT_LIST_HEAD(&local->mad_priv->header.recv_wc.rmpp_list);
2550			list_add(&local->mad_priv->header.recv_wc.recv_buf.list,
2551				 &local->mad_priv->header.recv_wc.rmpp_list);
2552			local->mad_priv->header.recv_wc.recv_buf.grh = NULL;
2553			local->mad_priv->header.recv_wc.recv_buf.mad =
2554						(struct ib_mad *)local->mad_priv->mad;
 
 
 
 
2555			recv_mad_agent->agent.recv_handler(
2556						&recv_mad_agent->agent,
2557						&local->mad_send_wr->send_buf,
2558						&local->mad_priv->header.recv_wc);
2559			spin_lock_irqsave(&recv_mad_agent->lock, flags);
2560			deref_mad_agent(recv_mad_agent);
2561			spin_unlock_irqrestore(&recv_mad_agent->lock, flags);
2562		}
2563
2564local_send_completion:
2565		/* Complete send */
2566		mad_send_wc.status = IB_WC_SUCCESS;
2567		mad_send_wc.vendor_err = 0;
2568		mad_send_wc.send_buf = &local->mad_send_wr->send_buf;
 
 
 
 
2569		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2570						   &mad_send_wc);
2571
2572		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2573		deref_mad_agent(mad_agent_priv);
2574		if (free_mad)
2575			kfree(local->mad_priv);
2576		kfree(local);
2577	}
2578	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2579}
2580
2581static int retry_send(struct ib_mad_send_wr_private *mad_send_wr)
2582{
2583	int ret;
2584
2585	if (!mad_send_wr->retries_left)
2586		return -ETIMEDOUT;
2587
2588	mad_send_wr->retries_left--;
2589	mad_send_wr->send_buf.retries++;
2590
2591	mad_send_wr->timeout = msecs_to_jiffies(mad_send_wr->send_buf.timeout_ms);
2592
2593	if (ib_mad_kernel_rmpp_agent(&mad_send_wr->mad_agent_priv->agent)) {
2594		ret = ib_retry_rmpp(mad_send_wr);
2595		switch (ret) {
2596		case IB_RMPP_RESULT_UNHANDLED:
2597			ret = ib_send_mad(mad_send_wr);
2598			break;
2599		case IB_RMPP_RESULT_CONSUMED:
2600			ret = 0;
2601			break;
2602		default:
2603			ret = -ECOMM;
2604			break;
2605		}
2606	} else
2607		ret = ib_send_mad(mad_send_wr);
2608
2609	if (!ret) {
2610		mad_send_wr->refcount++;
2611		list_add_tail(&mad_send_wr->agent_list,
2612			      &mad_send_wr->mad_agent_priv->send_list);
2613	}
2614	return ret;
2615}
2616
2617static void timeout_sends(struct work_struct *work)
2618{
2619	struct ib_mad_agent_private *mad_agent_priv;
2620	struct ib_mad_send_wr_private *mad_send_wr;
2621	struct ib_mad_send_wc mad_send_wc;
2622	unsigned long flags, delay;
2623
2624	mad_agent_priv = container_of(work, struct ib_mad_agent_private,
2625				      timed_work.work);
2626	mad_send_wc.vendor_err = 0;
2627
2628	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2629	while (!list_empty(&mad_agent_priv->wait_list)) {
2630		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2631					 struct ib_mad_send_wr_private,
2632					 agent_list);
2633
2634		if (time_after(mad_send_wr->timeout, jiffies)) {
2635			delay = mad_send_wr->timeout - jiffies;
2636			if ((long)delay <= 0)
2637				delay = 1;
2638			queue_delayed_work(mad_agent_priv->qp_info->
2639					   port_priv->wq,
2640					   &mad_agent_priv->timed_work, delay);
2641			break;
2642		}
2643
2644		list_del(&mad_send_wr->agent_list);
2645		if (mad_send_wr->status == IB_WC_SUCCESS &&
2646		    !retry_send(mad_send_wr))
2647			continue;
2648
2649		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2650
2651		if (mad_send_wr->status == IB_WC_SUCCESS)
2652			mad_send_wc.status = IB_WC_RESP_TIMEOUT_ERR;
2653		else
2654			mad_send_wc.status = mad_send_wr->status;
2655		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2656		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2657						   &mad_send_wc);
2658
2659		deref_mad_agent(mad_agent_priv);
2660		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2661	}
2662	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2663}
2664
 
 
 
 
 
 
 
 
 
 
 
2665/*
2666 * Allocate receive MADs and post receive WRs for them
2667 */
2668static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
2669				    struct ib_mad_private *mad)
2670{
2671	unsigned long flags;
2672	int post, ret;
2673	struct ib_mad_private *mad_priv;
2674	struct ib_sge sg_list;
2675	struct ib_recv_wr recv_wr;
2676	struct ib_mad_queue *recv_queue = &qp_info->recv_queue;
2677
2678	/* Initialize common scatter list fields */
2679	sg_list.lkey = qp_info->port_priv->pd->local_dma_lkey;
 
2680
2681	/* Initialize common receive WR fields */
2682	recv_wr.next = NULL;
2683	recv_wr.sg_list = &sg_list;
2684	recv_wr.num_sge = 1;
2685
2686	do {
2687		/* Allocate and map receive buffer */
2688		if (mad) {
2689			mad_priv = mad;
2690			mad = NULL;
2691		} else {
2692			mad_priv = alloc_mad_private(port_mad_size(qp_info->port_priv),
2693						     GFP_ATOMIC);
2694			if (!mad_priv) {
 
2695				ret = -ENOMEM;
2696				break;
2697			}
2698		}
2699		sg_list.length = mad_priv_dma_size(mad_priv);
2700		sg_list.addr = ib_dma_map_single(qp_info->port_priv->device,
2701						 &mad_priv->grh,
2702						 mad_priv_dma_size(mad_priv),
 
2703						 DMA_FROM_DEVICE);
2704		if (unlikely(ib_dma_mapping_error(qp_info->port_priv->device,
2705						  sg_list.addr))) {
2706			kfree(mad_priv);
2707			ret = -ENOMEM;
2708			break;
2709		}
2710		mad_priv->header.mapping = sg_list.addr;
 
2711		mad_priv->header.mad_list.mad_queue = recv_queue;
2712		mad_priv->header.mad_list.cqe.done = ib_mad_recv_done;
2713		recv_wr.wr_cqe = &mad_priv->header.mad_list.cqe;
2714
2715		/* Post receive WR */
2716		spin_lock_irqsave(&recv_queue->lock, flags);
2717		post = (++recv_queue->count < recv_queue->max_active);
2718		list_add_tail(&mad_priv->header.mad_list.list, &recv_queue->list);
2719		spin_unlock_irqrestore(&recv_queue->lock, flags);
2720		ret = ib_post_recv(qp_info->qp, &recv_wr, NULL);
2721		if (ret) {
2722			spin_lock_irqsave(&recv_queue->lock, flags);
2723			list_del(&mad_priv->header.mad_list.list);
2724			recv_queue->count--;
2725			spin_unlock_irqrestore(&recv_queue->lock, flags);
2726			ib_dma_unmap_single(qp_info->port_priv->device,
2727					    mad_priv->header.mapping,
2728					    mad_priv_dma_size(mad_priv),
 
2729					    DMA_FROM_DEVICE);
2730			kfree(mad_priv);
2731			dev_err(&qp_info->port_priv->device->dev,
2732				"ib_post_recv failed: %d\n", ret);
2733			break;
2734		}
2735	} while (post);
2736
2737	return ret;
2738}
2739
2740/*
2741 * Return all the posted receive MADs
2742 */
2743static void cleanup_recv_queue(struct ib_mad_qp_info *qp_info)
2744{
2745	struct ib_mad_private_header *mad_priv_hdr;
2746	struct ib_mad_private *recv;
2747	struct ib_mad_list_head *mad_list;
2748
2749	if (!qp_info->qp)
2750		return;
2751
2752	while (!list_empty(&qp_info->recv_queue.list)) {
2753
2754		mad_list = list_entry(qp_info->recv_queue.list.next,
2755				      struct ib_mad_list_head, list);
2756		mad_priv_hdr = container_of(mad_list,
2757					    struct ib_mad_private_header,
2758					    mad_list);
2759		recv = container_of(mad_priv_hdr, struct ib_mad_private,
2760				    header);
2761
2762		/* Remove from posted receive MAD list */
2763		list_del(&mad_list->list);
2764
2765		ib_dma_unmap_single(qp_info->port_priv->device,
2766				    recv->header.mapping,
2767				    mad_priv_dma_size(recv),
 
2768				    DMA_FROM_DEVICE);
2769		kfree(recv);
2770	}
2771
2772	qp_info->recv_queue.count = 0;
2773}
2774
2775/*
2776 * Start the port
2777 */
2778static int ib_mad_port_start(struct ib_mad_port_private *port_priv)
2779{
2780	int ret, i;
2781	struct ib_qp_attr *attr;
2782	struct ib_qp *qp;
2783	u16 pkey_index;
2784
2785	attr = kmalloc(sizeof *attr, GFP_KERNEL);
2786	if (!attr)
 
2787		return -ENOMEM;
2788
2789	ret = ib_find_pkey(port_priv->device, port_priv->port_num,
2790			   IB_DEFAULT_PKEY_FULL, &pkey_index);
2791	if (ret)
2792		pkey_index = 0;
2793
2794	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2795		qp = port_priv->qp_info[i].qp;
2796		if (!qp)
2797			continue;
2798
2799		/*
2800		 * PKey index for QP1 is irrelevant but
2801		 * one is needed for the Reset to Init transition
2802		 */
2803		attr->qp_state = IB_QPS_INIT;
2804		attr->pkey_index = pkey_index;
2805		attr->qkey = (qp->qp_num == 0) ? 0 : IB_QP1_QKEY;
2806		ret = ib_modify_qp(qp, attr, IB_QP_STATE |
2807					     IB_QP_PKEY_INDEX | IB_QP_QKEY);
2808		if (ret) {
2809			dev_err(&port_priv->device->dev,
2810				"Couldn't change QP%d state to INIT: %d\n",
2811				i, ret);
2812			goto out;
2813		}
2814
2815		attr->qp_state = IB_QPS_RTR;
2816		ret = ib_modify_qp(qp, attr, IB_QP_STATE);
2817		if (ret) {
2818			dev_err(&port_priv->device->dev,
2819				"Couldn't change QP%d state to RTR: %d\n",
2820				i, ret);
2821			goto out;
2822		}
2823
2824		attr->qp_state = IB_QPS_RTS;
2825		attr->sq_psn = IB_MAD_SEND_Q_PSN;
2826		ret = ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_SQ_PSN);
2827		if (ret) {
2828			dev_err(&port_priv->device->dev,
2829				"Couldn't change QP%d state to RTS: %d\n",
2830				i, ret);
2831			goto out;
2832		}
2833	}
2834
2835	ret = ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2836	if (ret) {
2837		dev_err(&port_priv->device->dev,
2838			"Failed to request completion notification: %d\n",
2839			ret);
2840		goto out;
2841	}
2842
2843	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2844		if (!port_priv->qp_info[i].qp)
2845			continue;
2846
2847		ret = ib_mad_post_receive_mads(&port_priv->qp_info[i], NULL);
2848		if (ret) {
2849			dev_err(&port_priv->device->dev,
2850				"Couldn't post receive WRs\n");
2851			goto out;
2852		}
2853	}
2854out:
2855	kfree(attr);
2856	return ret;
2857}
2858
2859static void qp_event_handler(struct ib_event *event, void *qp_context)
2860{
2861	struct ib_mad_qp_info	*qp_info = qp_context;
2862
2863	/* It's worse than that! He's dead, Jim! */
2864	dev_err(&qp_info->port_priv->device->dev,
2865		"Fatal error (%d) on MAD QP (%u)\n",
2866		event->event, qp_info->qp->qp_num);
2867}
2868
2869static void init_mad_queue(struct ib_mad_qp_info *qp_info,
2870			   struct ib_mad_queue *mad_queue)
2871{
2872	mad_queue->qp_info = qp_info;
2873	mad_queue->count = 0;
2874	spin_lock_init(&mad_queue->lock);
2875	INIT_LIST_HEAD(&mad_queue->list);
2876}
2877
2878static void init_mad_qp(struct ib_mad_port_private *port_priv,
2879			struct ib_mad_qp_info *qp_info)
2880{
2881	qp_info->port_priv = port_priv;
2882	init_mad_queue(qp_info, &qp_info->send_queue);
2883	init_mad_queue(qp_info, &qp_info->recv_queue);
2884	INIT_LIST_HEAD(&qp_info->overflow_list);
 
 
 
 
2885}
2886
2887static int create_mad_qp(struct ib_mad_qp_info *qp_info,
2888			 enum ib_qp_type qp_type)
2889{
2890	struct ib_qp_init_attr	qp_init_attr;
2891	int ret;
2892
2893	memset(&qp_init_attr, 0, sizeof qp_init_attr);
2894	qp_init_attr.send_cq = qp_info->port_priv->cq;
2895	qp_init_attr.recv_cq = qp_info->port_priv->cq;
2896	qp_init_attr.sq_sig_type = IB_SIGNAL_ALL_WR;
2897	qp_init_attr.cap.max_send_wr = mad_sendq_size;
2898	qp_init_attr.cap.max_recv_wr = mad_recvq_size;
2899	qp_init_attr.cap.max_send_sge = IB_MAD_SEND_REQ_MAX_SG;
2900	qp_init_attr.cap.max_recv_sge = IB_MAD_RECV_REQ_MAX_SG;
2901	qp_init_attr.qp_type = qp_type;
2902	qp_init_attr.port_num = qp_info->port_priv->port_num;
2903	qp_init_attr.qp_context = qp_info;
2904	qp_init_attr.event_handler = qp_event_handler;
2905	qp_info->qp = ib_create_qp(qp_info->port_priv->pd, &qp_init_attr);
2906	if (IS_ERR(qp_info->qp)) {
2907		dev_err(&qp_info->port_priv->device->dev,
2908			"Couldn't create ib_mad QP%d\n",
2909			get_spl_qp_index(qp_type));
2910		ret = PTR_ERR(qp_info->qp);
2911		goto error;
2912	}
2913	/* Use minimum queue sizes unless the CQ is resized */
2914	qp_info->send_queue.max_active = mad_sendq_size;
2915	qp_info->recv_queue.max_active = mad_recvq_size;
2916	return 0;
2917
2918error:
2919	return ret;
2920}
2921
2922static void destroy_mad_qp(struct ib_mad_qp_info *qp_info)
2923{
2924	if (!qp_info->qp)
2925		return;
2926
2927	ib_destroy_qp(qp_info->qp);
 
2928}
2929
2930/*
2931 * Open the port
2932 * Create the QP, PD, MR, and CQ if needed
2933 */
2934static int ib_mad_port_open(struct ib_device *device,
2935			    u32 port_num)
2936{
2937	int ret, cq_size;
2938	struct ib_mad_port_private *port_priv;
2939	unsigned long flags;
2940	char name[sizeof "ib_mad123"];
2941	int has_smi;
2942
2943	if (WARN_ON(rdma_max_mad_size(device, port_num) < IB_MGMT_MAD_SIZE))
2944		return -EFAULT;
2945
2946	if (WARN_ON(rdma_cap_opa_mad(device, port_num) &&
2947		    rdma_max_mad_size(device, port_num) < OPA_MGMT_MAD_SIZE))
2948		return -EFAULT;
2949
2950	/* Create new device info */
2951	port_priv = kzalloc(sizeof *port_priv, GFP_KERNEL);
2952	if (!port_priv)
 
2953		return -ENOMEM;
 
2954
2955	port_priv->device = device;
2956	port_priv->port_num = port_num;
2957	spin_lock_init(&port_priv->reg_lock);
 
2958	init_mad_qp(port_priv, &port_priv->qp_info[0]);
2959	init_mad_qp(port_priv, &port_priv->qp_info[1]);
2960
2961	cq_size = mad_sendq_size + mad_recvq_size;
2962	has_smi = rdma_cap_ib_smi(device, port_num);
2963	if (has_smi)
2964		cq_size *= 2;
2965
2966	port_priv->pd = ib_alloc_pd(device, 0);
2967	if (IS_ERR(port_priv->pd)) {
2968		dev_err(&device->dev, "Couldn't create ib_mad PD\n");
2969		ret = PTR_ERR(port_priv->pd);
 
 
2970		goto error3;
2971	}
2972
2973	port_priv->cq = ib_alloc_cq(port_priv->device, port_priv, cq_size, 0,
2974			IB_POLL_UNBOUND_WORKQUEUE);
2975	if (IS_ERR(port_priv->cq)) {
2976		dev_err(&device->dev, "Couldn't create ib_mad CQ\n");
2977		ret = PTR_ERR(port_priv->cq);
2978		goto error4;
2979	}
2980
 
 
 
 
 
 
 
2981	if (has_smi) {
2982		ret = create_mad_qp(&port_priv->qp_info[0], IB_QPT_SMI);
2983		if (ret)
2984			goto error6;
2985	}
2986	ret = create_mad_qp(&port_priv->qp_info[1], IB_QPT_GSI);
2987	if (ret)
2988		goto error7;
2989
2990	snprintf(name, sizeof(name), "ib_mad%u", port_num);
2991	port_priv->wq = alloc_ordered_workqueue(name, WQ_MEM_RECLAIM);
2992	if (!port_priv->wq) {
2993		ret = -ENOMEM;
2994		goto error8;
2995	}
 
2996
2997	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2998	list_add_tail(&port_priv->port_list, &ib_mad_port_list);
2999	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3000
3001	ret = ib_mad_port_start(port_priv);
3002	if (ret) {
3003		dev_err(&device->dev, "Couldn't start port\n");
3004		goto error9;
3005	}
3006
3007	return 0;
3008
3009error9:
3010	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
3011	list_del_init(&port_priv->port_list);
3012	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3013
3014	destroy_workqueue(port_priv->wq);
3015error8:
3016	destroy_mad_qp(&port_priv->qp_info[1]);
3017error7:
3018	destroy_mad_qp(&port_priv->qp_info[0]);
3019error6:
3020	ib_free_cq(port_priv->cq);
 
 
 
 
3021	cleanup_recv_queue(&port_priv->qp_info[1]);
3022	cleanup_recv_queue(&port_priv->qp_info[0]);
3023error4:
3024	ib_dealloc_pd(port_priv->pd);
3025error3:
3026	kfree(port_priv);
3027
3028	return ret;
3029}
3030
3031/*
3032 * Close the port
3033 * If there are no classes using the port, free the port
3034 * resources (CQ, MR, PD, QP) and remove the port's info structure
3035 */
3036static int ib_mad_port_close(struct ib_device *device, u32 port_num)
3037{
3038	struct ib_mad_port_private *port_priv;
3039	unsigned long flags;
3040
3041	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
3042	port_priv = __ib_get_mad_port(device, port_num);
3043	if (port_priv == NULL) {
3044		spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3045		dev_err(&device->dev, "Port %u not found\n", port_num);
3046		return -ENODEV;
3047	}
3048	list_del_init(&port_priv->port_list);
3049	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3050
3051	destroy_workqueue(port_priv->wq);
3052	destroy_mad_qp(&port_priv->qp_info[1]);
3053	destroy_mad_qp(&port_priv->qp_info[0]);
3054	ib_free_cq(port_priv->cq);
3055	ib_dealloc_pd(port_priv->pd);
 
3056	cleanup_recv_queue(&port_priv->qp_info[1]);
3057	cleanup_recv_queue(&port_priv->qp_info[0]);
3058	/* XXX: Handle deallocation of MAD registration tables */
3059
3060	kfree(port_priv);
3061
3062	return 0;
3063}
3064
3065static int ib_mad_init_device(struct ib_device *device)
3066{
3067	int start, i;
3068	unsigned int count = 0;
3069	int ret;
3070
3071	start = rdma_start_port(device);
 
3072
3073	for (i = start; i <= rdma_end_port(device); i++) {
3074		if (!rdma_cap_ib_mad(device, i))
3075			continue;
 
 
 
 
3076
3077		ret = ib_mad_port_open(device, i);
3078		if (ret) {
3079			dev_err(&device->dev, "Couldn't open port %d\n", i);
 
3080			goto error;
3081		}
3082		ret = ib_agent_port_open(device, i);
3083		if (ret) {
3084			dev_err(&device->dev,
3085				"Couldn't open port %d for agents\n", i);
3086			goto error_agent;
3087		}
3088		count++;
3089	}
3090	if (!count)
3091		return -EOPNOTSUPP;
3092
3093	return 0;
3094
3095error_agent:
3096	if (ib_mad_port_close(device, i))
3097		dev_err(&device->dev, "Couldn't close port %d\n", i);
 
3098
3099error:
3100	while (--i >= start) {
3101		if (!rdma_cap_ib_mad(device, i))
3102			continue;
3103
 
3104		if (ib_agent_port_close(device, i))
3105			dev_err(&device->dev,
3106				"Couldn't close port %d for agents\n", i);
 
3107		if (ib_mad_port_close(device, i))
3108			dev_err(&device->dev, "Couldn't close port %d\n", i);
 
 
3109	}
3110	return ret;
3111}
3112
3113static void ib_mad_remove_device(struct ib_device *device, void *client_data)
3114{
3115	unsigned int i;
3116
3117	rdma_for_each_port (device, i) {
3118		if (!rdma_cap_ib_mad(device, i))
3119			continue;
3120
3121		if (ib_agent_port_close(device, i))
3122			dev_err(&device->dev,
3123				"Couldn't close port %u for agents\n", i);
3124		if (ib_mad_port_close(device, i))
3125			dev_err(&device->dev, "Couldn't close port %u\n", i);
 
 
 
 
 
 
 
 
 
 
3126	}
3127}
3128
3129static struct ib_client mad_client = {
3130	.name   = "mad",
3131	.add = ib_mad_init_device,
3132	.remove = ib_mad_remove_device
3133};
3134
3135int ib_mad_init(void)
3136{
 
 
3137	mad_recvq_size = min(mad_recvq_size, IB_MAD_QP_MAX_SIZE);
3138	mad_recvq_size = max(mad_recvq_size, IB_MAD_QP_MIN_SIZE);
3139
3140	mad_sendq_size = min(mad_sendq_size, IB_MAD_QP_MAX_SIZE);
3141	mad_sendq_size = max(mad_sendq_size, IB_MAD_QP_MIN_SIZE);
3142
 
 
 
 
 
 
 
 
 
 
 
3143	INIT_LIST_HEAD(&ib_mad_port_list);
3144
3145	if (ib_register_client(&mad_client)) {
3146		pr_err("Couldn't register ib_mad client\n");
3147		return -EINVAL;
 
3148	}
3149
3150	return 0;
 
 
 
 
 
3151}
3152
3153void ib_mad_cleanup(void)
3154{
3155	ib_unregister_client(&mad_client);
 
3156}
v3.5.6
   1/*
   2 * Copyright (c) 2004-2007 Voltaire, Inc. All rights reserved.
   3 * Copyright (c) 2005 Intel Corporation.  All rights reserved.
   4 * Copyright (c) 2005 Mellanox Technologies Ltd.  All rights reserved.
   5 * Copyright (c) 2009 HNR Consulting. All rights reserved.
 
   6 *
   7 * This software is available to you under a choice of one of two
   8 * licenses.  You may choose to be licensed under the terms of the GNU
   9 * General Public License (GPL) Version 2, available from the file
  10 * COPYING in the main directory of this source tree, or the
  11 * OpenIB.org BSD license below:
  12 *
  13 *     Redistribution and use in source and binary forms, with or
  14 *     without modification, are permitted provided that the following
  15 *     conditions are met:
  16 *
  17 *      - Redistributions of source code must retain the above
  18 *        copyright notice, this list of conditions and the following
  19 *        disclaimer.
  20 *
  21 *      - Redistributions in binary form must reproduce the above
  22 *        copyright notice, this list of conditions and the following
  23 *        disclaimer in the documentation and/or other materials
  24 *        provided with the distribution.
  25 *
  26 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  27 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  28 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  29 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  30 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  31 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  32 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  33 * SOFTWARE.
  34 *
  35 */
 
 
 
  36#include <linux/dma-mapping.h>
  37#include <linux/slab.h>
  38#include <linux/module.h>
 
 
  39#include <rdma/ib_cache.h>
  40
  41#include "mad_priv.h"
 
  42#include "mad_rmpp.h"
  43#include "smi.h"
 
  44#include "agent.h"
  45
  46MODULE_LICENSE("Dual BSD/GPL");
  47MODULE_DESCRIPTION("kernel IB MAD API");
  48MODULE_AUTHOR("Hal Rosenstock");
  49MODULE_AUTHOR("Sean Hefty");
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
  50
  51static int mad_sendq_size = IB_MAD_QP_SEND_SIZE;
  52static int mad_recvq_size = IB_MAD_QP_RECV_SIZE;
  53
  54module_param_named(send_queue_size, mad_sendq_size, int, 0444);
  55MODULE_PARM_DESC(send_queue_size, "Size of send queue in number of work requests");
  56module_param_named(recv_queue_size, mad_recvq_size, int, 0444);
  57MODULE_PARM_DESC(recv_queue_size, "Size of receive queue in number of work requests");
  58
  59static struct kmem_cache *ib_mad_cache;
  60
  61static struct list_head ib_mad_port_list;
  62static u32 ib_mad_client_id = 0;
  63
  64/* Port list lock */
  65static DEFINE_SPINLOCK(ib_mad_port_list_lock);
  66
  67/* Forward declarations */
  68static int method_in_use(struct ib_mad_mgmt_method_table **method,
  69			 struct ib_mad_reg_req *mad_reg_req);
  70static void remove_mad_reg_req(struct ib_mad_agent_private *priv);
  71static struct ib_mad_agent_private *find_mad_agent(
  72					struct ib_mad_port_private *port_priv,
  73					struct ib_mad *mad);
  74static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
  75				    struct ib_mad_private *mad);
  76static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv);
  77static void timeout_sends(struct work_struct *work);
  78static void local_completions(struct work_struct *work);
  79static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
  80			      struct ib_mad_agent_private *agent_priv,
  81			      u8 mgmt_class);
  82static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
  83			   struct ib_mad_agent_private *agent_priv);
 
 
 
  84
  85/*
  86 * Returns a ib_mad_port_private structure or NULL for a device/port
  87 * Assumes ib_mad_port_list_lock is being held
  88 */
  89static inline struct ib_mad_port_private *
  90__ib_get_mad_port(struct ib_device *device, int port_num)
  91{
  92	struct ib_mad_port_private *entry;
  93
  94	list_for_each_entry(entry, &ib_mad_port_list, port_list) {
  95		if (entry->device == device && entry->port_num == port_num)
  96			return entry;
  97	}
  98	return NULL;
  99}
 100
 101/*
 102 * Wrapper function to return a ib_mad_port_private structure or NULL
 103 * for a device/port
 104 */
 105static inline struct ib_mad_port_private *
 106ib_get_mad_port(struct ib_device *device, int port_num)
 107{
 108	struct ib_mad_port_private *entry;
 109	unsigned long flags;
 110
 111	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
 112	entry = __ib_get_mad_port(device, port_num);
 113	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
 114
 115	return entry;
 116}
 117
 118static inline u8 convert_mgmt_class(u8 mgmt_class)
 119{
 120	/* Alias IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE to 0 */
 121	return mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE ?
 122		0 : mgmt_class;
 123}
 124
 125static int get_spl_qp_index(enum ib_qp_type qp_type)
 126{
 127	switch (qp_type)
 128	{
 129	case IB_QPT_SMI:
 130		return 0;
 131	case IB_QPT_GSI:
 132		return 1;
 133	default:
 134		return -1;
 135	}
 136}
 137
 138static int vendor_class_index(u8 mgmt_class)
 139{
 140	return mgmt_class - IB_MGMT_CLASS_VENDOR_RANGE2_START;
 141}
 142
 143static int is_vendor_class(u8 mgmt_class)
 144{
 145	if ((mgmt_class < IB_MGMT_CLASS_VENDOR_RANGE2_START) ||
 146	    (mgmt_class > IB_MGMT_CLASS_VENDOR_RANGE2_END))
 147		return 0;
 148	return 1;
 149}
 150
 151static int is_vendor_oui(char *oui)
 152{
 153	if (oui[0] || oui[1] || oui[2])
 154		return 1;
 155	return 0;
 156}
 157
 158static int is_vendor_method_in_use(
 159		struct ib_mad_mgmt_vendor_class *vendor_class,
 160		struct ib_mad_reg_req *mad_reg_req)
 161{
 162	struct ib_mad_mgmt_method_table *method;
 163	int i;
 164
 165	for (i = 0; i < MAX_MGMT_OUI; i++) {
 166		if (!memcmp(vendor_class->oui[i], mad_reg_req->oui, 3)) {
 167			method = vendor_class->method_table[i];
 168			if (method) {
 169				if (method_in_use(&method, mad_reg_req))
 170					return 1;
 171				else
 172					break;
 173			}
 174		}
 175	}
 176	return 0;
 177}
 178
 179int ib_response_mad(struct ib_mad *mad)
 180{
 181	return ((mad->mad_hdr.method & IB_MGMT_METHOD_RESP) ||
 182		(mad->mad_hdr.method == IB_MGMT_METHOD_TRAP_REPRESS) ||
 183		((mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_BM) &&
 184		 (mad->mad_hdr.attr_mod & IB_BM_ATTR_MOD_RESP)));
 185}
 186EXPORT_SYMBOL(ib_response_mad);
 187
 188/*
 189 * ib_register_mad_agent - Register to send/receive MADs
 
 
 190 */
 191struct ib_mad_agent *ib_register_mad_agent(struct ib_device *device,
 192					   u8 port_num,
 193					   enum ib_qp_type qp_type,
 194					   struct ib_mad_reg_req *mad_reg_req,
 195					   u8 rmpp_version,
 196					   ib_mad_send_handler send_handler,
 197					   ib_mad_recv_handler recv_handler,
 198					   void *context)
 
 199{
 200	struct ib_mad_port_private *port_priv;
 201	struct ib_mad_agent *ret = ERR_PTR(-EINVAL);
 202	struct ib_mad_agent_private *mad_agent_priv;
 203	struct ib_mad_reg_req *reg_req = NULL;
 204	struct ib_mad_mgmt_class_table *class;
 205	struct ib_mad_mgmt_vendor_class_table *vendor;
 206	struct ib_mad_mgmt_vendor_class *vendor_class;
 207	struct ib_mad_mgmt_method_table *method;
 208	int ret2, qpn;
 209	unsigned long flags;
 210	u8 mgmt_class, vclass;
 211
 
 
 
 
 212	/* Validate parameters */
 213	qpn = get_spl_qp_index(qp_type);
 214	if (qpn == -1)
 
 
 215		goto error1;
 
 216
 217	if (rmpp_version && rmpp_version != IB_MGMT_RMPP_VERSION)
 
 
 
 218		goto error1;
 
 219
 220	/* Validate MAD registration request if supplied */
 221	if (mad_reg_req) {
 222		if (mad_reg_req->mgmt_class_version >= MAX_MGMT_VERSION)
 
 
 
 
 223			goto error1;
 224		if (!recv_handler)
 
 
 
 225			goto error1;
 
 226		if (mad_reg_req->mgmt_class >= MAX_MGMT_CLASS) {
 227			/*
 228			 * IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE is the only
 229			 * one in this range currently allowed
 230			 */
 231			if (mad_reg_req->mgmt_class !=
 232			    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
 
 
 
 233				goto error1;
 
 234		} else if (mad_reg_req->mgmt_class == 0) {
 235			/*
 236			 * Class 0 is reserved in IBA and is used for
 237			 * aliasing of IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE
 238			 */
 
 
 
 239			goto error1;
 240		} else if (is_vendor_class(mad_reg_req->mgmt_class)) {
 241			/*
 242			 * If class is in "new" vendor range,
 243			 * ensure supplied OUI is not zero
 244			 */
 245			if (!is_vendor_oui(mad_reg_req->oui))
 
 
 
 
 246				goto error1;
 
 247		}
 248		/* Make sure class supplied is consistent with RMPP */
 249		if (!ib_is_mad_class_rmpp(mad_reg_req->mgmt_class)) {
 250			if (rmpp_version)
 
 
 
 251				goto error1;
 
 252		}
 
 253		/* Make sure class supplied is consistent with QP type */
 254		if (qp_type == IB_QPT_SMI) {
 255			if ((mad_reg_req->mgmt_class !=
 256					IB_MGMT_CLASS_SUBN_LID_ROUTED) &&
 257			    (mad_reg_req->mgmt_class !=
 258					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE))
 
 
 
 259				goto error1;
 
 260		} else {
 261			if ((mad_reg_req->mgmt_class ==
 262					IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
 263			    (mad_reg_req->mgmt_class ==
 264					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE))
 
 
 
 265				goto error1;
 
 266		}
 267	} else {
 268		/* No registration request supplied */
 269		if (!send_handler)
 270			goto error1;
 
 
 271	}
 272
 273	/* Validate device and port */
 274	port_priv = ib_get_mad_port(device, port_num);
 275	if (!port_priv) {
 
 
 276		ret = ERR_PTR(-ENODEV);
 277		goto error1;
 278	}
 279
 280	/* Verify the QP requested is supported.  For example, Ethernet devices
 281	 * will not have QP0 */
 
 282	if (!port_priv->qp_info[qpn].qp) {
 
 
 283		ret = ERR_PTR(-EPROTONOSUPPORT);
 284		goto error1;
 285	}
 286
 287	/* Allocate structures */
 288	mad_agent_priv = kzalloc(sizeof *mad_agent_priv, GFP_KERNEL);
 289	if (!mad_agent_priv) {
 290		ret = ERR_PTR(-ENOMEM);
 291		goto error1;
 292	}
 293
 294	mad_agent_priv->agent.mr = ib_get_dma_mr(port_priv->qp_info[qpn].qp->pd,
 295						 IB_ACCESS_LOCAL_WRITE);
 296	if (IS_ERR(mad_agent_priv->agent.mr)) {
 297		ret = ERR_PTR(-ENOMEM);
 298		goto error2;
 299	}
 300
 301	if (mad_reg_req) {
 302		reg_req = kmemdup(mad_reg_req, sizeof *reg_req, GFP_KERNEL);
 303		if (!reg_req) {
 304			ret = ERR_PTR(-ENOMEM);
 305			goto error3;
 306		}
 307	}
 308
 309	/* Now, fill in the various structures */
 310	mad_agent_priv->qp_info = &port_priv->qp_info[qpn];
 311	mad_agent_priv->reg_req = reg_req;
 312	mad_agent_priv->agent.rmpp_version = rmpp_version;
 313	mad_agent_priv->agent.device = device;
 314	mad_agent_priv->agent.recv_handler = recv_handler;
 315	mad_agent_priv->agent.send_handler = send_handler;
 316	mad_agent_priv->agent.context = context;
 317	mad_agent_priv->agent.qp = port_priv->qp_info[qpn].qp;
 318	mad_agent_priv->agent.port_num = port_num;
 
 319	spin_lock_init(&mad_agent_priv->lock);
 320	INIT_LIST_HEAD(&mad_agent_priv->send_list);
 321	INIT_LIST_HEAD(&mad_agent_priv->wait_list);
 322	INIT_LIST_HEAD(&mad_agent_priv->done_list);
 323	INIT_LIST_HEAD(&mad_agent_priv->rmpp_list);
 324	INIT_DELAYED_WORK(&mad_agent_priv->timed_work, timeout_sends);
 325	INIT_LIST_HEAD(&mad_agent_priv->local_list);
 326	INIT_WORK(&mad_agent_priv->local_work, local_completions);
 327	atomic_set(&mad_agent_priv->refcount, 1);
 328	init_completion(&mad_agent_priv->comp);
 329
 330	spin_lock_irqsave(&port_priv->reg_lock, flags);
 331	mad_agent_priv->agent.hi_tid = ++ib_mad_client_id;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 332
 333	/*
 334	 * Make sure MAD registration (if supplied)
 335	 * is non overlapping with any existing ones
 336	 */
 
 337	if (mad_reg_req) {
 338		mgmt_class = convert_mgmt_class(mad_reg_req->mgmt_class);
 339		if (!is_vendor_class(mgmt_class)) {
 340			class = port_priv->version[mad_reg_req->
 341						   mgmt_class_version].class;
 342			if (class) {
 343				method = class->method_table[mgmt_class];
 344				if (method) {
 345					if (method_in_use(&method,
 346							   mad_reg_req))
 347						goto error4;
 348				}
 349			}
 350			ret2 = add_nonoui_reg_req(mad_reg_req, mad_agent_priv,
 351						  mgmt_class);
 352		} else {
 353			/* "New" vendor class range */
 354			vendor = port_priv->version[mad_reg_req->
 355						    mgmt_class_version].vendor;
 356			if (vendor) {
 357				vclass = vendor_class_index(mgmt_class);
 358				vendor_class = vendor->vendor_class[vclass];
 359				if (vendor_class) {
 360					if (is_vendor_method_in_use(
 361							vendor_class,
 362							mad_reg_req))
 363						goto error4;
 364				}
 365			}
 366			ret2 = add_oui_reg_req(mad_reg_req, mad_agent_priv);
 367		}
 368		if (ret2) {
 369			ret = ERR_PTR(ret2);
 370			goto error4;
 371		}
 372	}
 
 373
 374	/* Add mad agent into port's agent list */
 375	list_add_tail(&mad_agent_priv->agent_list, &port_priv->agent_list);
 376	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 377
 378	return &mad_agent_priv->agent;
 379
 
 
 
 
 380error4:
 381	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 382	kfree(reg_req);
 383error3:
 384	ib_dereg_mr(mad_agent_priv->agent.mr);
 385error2:
 386	kfree(mad_agent_priv);
 387error1:
 388	return ret;
 389}
 390EXPORT_SYMBOL(ib_register_mad_agent);
 391
 392static inline int is_snooping_sends(int mad_snoop_flags)
 393{
 394	return (mad_snoop_flags &
 395		(/*IB_MAD_SNOOP_POSTED_SENDS |
 396		 IB_MAD_SNOOP_RMPP_SENDS |*/
 397		 IB_MAD_SNOOP_SEND_COMPLETIONS /*|
 398		 IB_MAD_SNOOP_RMPP_SEND_COMPLETIONS*/));
 399}
 400
 401static inline int is_snooping_recvs(int mad_snoop_flags)
 402{
 403	return (mad_snoop_flags &
 404		(IB_MAD_SNOOP_RECVS /*|
 405		 IB_MAD_SNOOP_RMPP_RECVS*/));
 406}
 407
 408static int register_snoop_agent(struct ib_mad_qp_info *qp_info,
 409				struct ib_mad_snoop_private *mad_snoop_priv)
 410{
 411	struct ib_mad_snoop_private **new_snoop_table;
 412	unsigned long flags;
 413	int i;
 414
 415	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 416	/* Check for empty slot in array. */
 417	for (i = 0; i < qp_info->snoop_table_size; i++)
 418		if (!qp_info->snoop_table[i])
 419			break;
 420
 421	if (i == qp_info->snoop_table_size) {
 422		/* Grow table. */
 423		new_snoop_table = krealloc(qp_info->snoop_table,
 424					   sizeof mad_snoop_priv *
 425					   (qp_info->snoop_table_size + 1),
 426					   GFP_ATOMIC);
 427		if (!new_snoop_table) {
 428			i = -ENOMEM;
 429			goto out;
 430		}
 431
 432		qp_info->snoop_table = new_snoop_table;
 433		qp_info->snoop_table_size++;
 434	}
 435	qp_info->snoop_table[i] = mad_snoop_priv;
 436	atomic_inc(&qp_info->snoop_count);
 437out:
 438	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 439	return i;
 440}
 441
 442struct ib_mad_agent *ib_register_mad_snoop(struct ib_device *device,
 443					   u8 port_num,
 444					   enum ib_qp_type qp_type,
 445					   int mad_snoop_flags,
 446					   ib_mad_snoop_handler snoop_handler,
 447					   ib_mad_recv_handler recv_handler,
 448					   void *context)
 449{
 450	struct ib_mad_port_private *port_priv;
 451	struct ib_mad_agent *ret;
 452	struct ib_mad_snoop_private *mad_snoop_priv;
 453	int qpn;
 454
 455	/* Validate parameters */
 456	if ((is_snooping_sends(mad_snoop_flags) && !snoop_handler) ||
 457	    (is_snooping_recvs(mad_snoop_flags) && !recv_handler)) {
 458		ret = ERR_PTR(-EINVAL);
 459		goto error1;
 460	}
 461	qpn = get_spl_qp_index(qp_type);
 462	if (qpn == -1) {
 463		ret = ERR_PTR(-EINVAL);
 464		goto error1;
 465	}
 466	port_priv = ib_get_mad_port(device, port_num);
 467	if (!port_priv) {
 468		ret = ERR_PTR(-ENODEV);
 469		goto error1;
 470	}
 471	/* Allocate structures */
 472	mad_snoop_priv = kzalloc(sizeof *mad_snoop_priv, GFP_KERNEL);
 473	if (!mad_snoop_priv) {
 474		ret = ERR_PTR(-ENOMEM);
 475		goto error1;
 476	}
 477
 478	/* Now, fill in the various structures */
 479	mad_snoop_priv->qp_info = &port_priv->qp_info[qpn];
 480	mad_snoop_priv->agent.device = device;
 481	mad_snoop_priv->agent.recv_handler = recv_handler;
 482	mad_snoop_priv->agent.snoop_handler = snoop_handler;
 483	mad_snoop_priv->agent.context = context;
 484	mad_snoop_priv->agent.qp = port_priv->qp_info[qpn].qp;
 485	mad_snoop_priv->agent.port_num = port_num;
 486	mad_snoop_priv->mad_snoop_flags = mad_snoop_flags;
 487	init_completion(&mad_snoop_priv->comp);
 488	mad_snoop_priv->snoop_index = register_snoop_agent(
 489						&port_priv->qp_info[qpn],
 490						mad_snoop_priv);
 491	if (mad_snoop_priv->snoop_index < 0) {
 492		ret = ERR_PTR(mad_snoop_priv->snoop_index);
 493		goto error2;
 494	}
 495
 496	atomic_set(&mad_snoop_priv->refcount, 1);
 497	return &mad_snoop_priv->agent;
 498
 499error2:
 500	kfree(mad_snoop_priv);
 501error1:
 502	return ret;
 503}
 504EXPORT_SYMBOL(ib_register_mad_snoop);
 505
 506static inline void deref_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 507{
 508	if (atomic_dec_and_test(&mad_agent_priv->refcount))
 509		complete(&mad_agent_priv->comp);
 510}
 511
 512static inline void deref_snoop_agent(struct ib_mad_snoop_private *mad_snoop_priv)
 513{
 514	if (atomic_dec_and_test(&mad_snoop_priv->refcount))
 515		complete(&mad_snoop_priv->comp);
 516}
 517
 518static void unregister_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 519{
 520	struct ib_mad_port_private *port_priv;
 521	unsigned long flags;
 522
 523	/* Note that we could still be handling received MADs */
 
 524
 525	/*
 526	 * Canceling all sends results in dropping received response
 527	 * MADs, preventing us from queuing additional work
 528	 */
 529	cancel_mads(mad_agent_priv);
 530	port_priv = mad_agent_priv->qp_info->port_priv;
 531	cancel_delayed_work(&mad_agent_priv->timed_work);
 532
 533	spin_lock_irqsave(&port_priv->reg_lock, flags);
 534	remove_mad_reg_req(mad_agent_priv);
 535	list_del(&mad_agent_priv->agent_list);
 536	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 537
 538	flush_workqueue(port_priv->wq);
 539	ib_cancel_rmpp_recvs(mad_agent_priv);
 540
 541	deref_mad_agent(mad_agent_priv);
 542	wait_for_completion(&mad_agent_priv->comp);
 
 
 
 543
 544	kfree(mad_agent_priv->reg_req);
 545	ib_dereg_mr(mad_agent_priv->agent.mr);
 546	kfree(mad_agent_priv);
 547}
 548
 549static void unregister_mad_snoop(struct ib_mad_snoop_private *mad_snoop_priv)
 550{
 551	struct ib_mad_qp_info *qp_info;
 552	unsigned long flags;
 553
 554	qp_info = mad_snoop_priv->qp_info;
 555	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 556	qp_info->snoop_table[mad_snoop_priv->snoop_index] = NULL;
 557	atomic_dec(&qp_info->snoop_count);
 558	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 559
 560	deref_snoop_agent(mad_snoop_priv);
 561	wait_for_completion(&mad_snoop_priv->comp);
 562
 563	kfree(mad_snoop_priv);
 564}
 565
 566/*
 567 * ib_unregister_mad_agent - Unregisters a client from using MAD services
 
 
 568 */
 569int ib_unregister_mad_agent(struct ib_mad_agent *mad_agent)
 570{
 571	struct ib_mad_agent_private *mad_agent_priv;
 572	struct ib_mad_snoop_private *mad_snoop_priv;
 573
 574	/* If the TID is zero, the agent can only snoop. */
 575	if (mad_agent->hi_tid) {
 576		mad_agent_priv = container_of(mad_agent,
 577					      struct ib_mad_agent_private,
 578					      agent);
 579		unregister_mad_agent(mad_agent_priv);
 580	} else {
 581		mad_snoop_priv = container_of(mad_agent,
 582					      struct ib_mad_snoop_private,
 583					      agent);
 584		unregister_mad_snoop(mad_snoop_priv);
 585	}
 586	return 0;
 587}
 588EXPORT_SYMBOL(ib_unregister_mad_agent);
 589
 590static void dequeue_mad(struct ib_mad_list_head *mad_list)
 591{
 592	struct ib_mad_queue *mad_queue;
 593	unsigned long flags;
 594
 595	BUG_ON(!mad_list->mad_queue);
 596	mad_queue = mad_list->mad_queue;
 597	spin_lock_irqsave(&mad_queue->lock, flags);
 598	list_del(&mad_list->list);
 599	mad_queue->count--;
 600	spin_unlock_irqrestore(&mad_queue->lock, flags);
 601}
 602
 603static void snoop_send(struct ib_mad_qp_info *qp_info,
 604		       struct ib_mad_send_buf *send_buf,
 605		       struct ib_mad_send_wc *mad_send_wc,
 606		       int mad_snoop_flags)
 607{
 608	struct ib_mad_snoop_private *mad_snoop_priv;
 609	unsigned long flags;
 610	int i;
 611
 612	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 613	for (i = 0; i < qp_info->snoop_table_size; i++) {
 614		mad_snoop_priv = qp_info->snoop_table[i];
 615		if (!mad_snoop_priv ||
 616		    !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
 617			continue;
 618
 619		atomic_inc(&mad_snoop_priv->refcount);
 620		spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 621		mad_snoop_priv->agent.snoop_handler(&mad_snoop_priv->agent,
 622						    send_buf, mad_send_wc);
 623		deref_snoop_agent(mad_snoop_priv);
 624		spin_lock_irqsave(&qp_info->snoop_lock, flags);
 625	}
 626	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 627}
 628
 629static void snoop_recv(struct ib_mad_qp_info *qp_info,
 630		       struct ib_mad_recv_wc *mad_recv_wc,
 631		       int mad_snoop_flags)
 632{
 633	struct ib_mad_snoop_private *mad_snoop_priv;
 634	unsigned long flags;
 635	int i;
 636
 637	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 638	for (i = 0; i < qp_info->snoop_table_size; i++) {
 639		mad_snoop_priv = qp_info->snoop_table[i];
 640		if (!mad_snoop_priv ||
 641		    !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
 642			continue;
 643
 644		atomic_inc(&mad_snoop_priv->refcount);
 645		spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 646		mad_snoop_priv->agent.recv_handler(&mad_snoop_priv->agent,
 647						   mad_recv_wc);
 648		deref_snoop_agent(mad_snoop_priv);
 649		spin_lock_irqsave(&qp_info->snoop_lock, flags);
 650	}
 651	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 652}
 653
 654static void build_smp_wc(struct ib_qp *qp,
 655			 u64 wr_id, u16 slid, u16 pkey_index, u8 port_num,
 656			 struct ib_wc *wc)
 657{
 658	memset(wc, 0, sizeof *wc);
 659	wc->wr_id = wr_id;
 660	wc->status = IB_WC_SUCCESS;
 661	wc->opcode = IB_WC_RECV;
 662	wc->pkey_index = pkey_index;
 663	wc->byte_len = sizeof(struct ib_mad) + sizeof(struct ib_grh);
 664	wc->src_qp = IB_QP0;
 665	wc->qp = qp;
 666	wc->slid = slid;
 667	wc->sl = 0;
 668	wc->dlid_path_bits = 0;
 669	wc->port_num = port_num;
 670}
 671
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 672/*
 673 * Return 0 if SMP is to be sent
 674 * Return 1 if SMP was consumed locally (whether or not solicited)
 675 * Return < 0 if error
 676 */
 677static int handle_outgoing_dr_smp(struct ib_mad_agent_private *mad_agent_priv,
 678				  struct ib_mad_send_wr_private *mad_send_wr)
 679{
	/*
	 * ret stays 0 when the caller should go on and post the send to the
	 * QP, becomes 1 once the SMP has been queued for local completion,
	 * and is a negative errno (-EINVAL / -ENOMEM) on failure.
	 */
 680	int ret = 0;
 681	struct ib_smp *smp = mad_send_wr->send_buf.mad;

 682	unsigned long flags;
 683	struct ib_mad_local_private *local;
 684	struct ib_mad_private *mad_priv;
 685	struct ib_mad_port_private *port_priv;
 686	struct ib_mad_agent_private *recv_mad_agent = NULL;
 687	struct ib_device *device = mad_agent_priv->agent.device;
 688	u8 port_num;
 689	struct ib_wc mad_wc;
 690	struct ib_send_wr *send_wr = &mad_send_wr->send_wr;





 691
	/*
	 * On a switch, a directed-route SMP uses the port named in the send
	 * work request; in every other case the agent's own port is used.
	 */
 692	if (device->node_type == RDMA_NODE_IB_SWITCH &&
 693	    smp->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
 694		port_num = send_wr->wr.ud.port_num;
 695	else
 696		port_num = mad_agent_priv->agent.port_num;
 697
 698	/*
 699	 * Directed route handling starts if the initial LID routed part of
 700	 * a request or the ending LID routed part of a response is empty.
 701	 * If we are at the start of the LID routed part, don't update the
 702	 * hop_ptr or hop_cnt.  See section 14.2.2, Vol 1 IB spec.
 703	 */
 704	if ((ib_get_smp_direction(smp) ? smp->dr_dlid : smp->dr_slid) ==
 705	     IB_LID_PERMISSIVE &&
 706	     smi_handle_dr_smp_send(smp, device->node_type, port_num) ==
 707	     IB_SMI_DISCARD) {
 708		ret = -EINVAL;
 709		printk(KERN_ERR PFX "Invalid directed route\n");
 710		goto out;







































 711	}
 712
 713	/* Check to post send on QP or process locally */
	/* Both checks returning DISCARD leaves ret at 0: not a local SMP. */
 714	if (smi_check_local_smp(smp, device) == IB_SMI_DISCARD &&
 715	    smi_check_local_returning_smp(smp, device) == IB_SMI_DISCARD)
 716		goto out;
 717
	/*
	 * Local handling needs two atomic allocations: the bookkeeping entry
	 * that is queued on the agent's local_list, and a MAD buffer handed
	 * to process_mad() as its output argument.
	 */
 718	local = kmalloc(sizeof *local, GFP_ATOMIC);
 719	if (!local) {
 720		ret = -ENOMEM;
 721		printk(KERN_ERR PFX "No memory for ib_mad_local_private\n");
 722		goto out;
 723	}
 724	local->mad_priv = NULL;
 725	local->recv_mad_agent = NULL;
 726	mad_priv = kmem_cache_alloc(ib_mad_cache, GFP_ATOMIC);
 727	if (!mad_priv) {
 728		ret = -ENOMEM;
 729		printk(KERN_ERR PFX "No memory for local response MAD\n");
 730		kfree(local);
 731		goto out;
 732	}
 733
 734	build_smp_wc(mad_agent_priv->agent.qp,
 735		     send_wr->wr_id, be16_to_cpu(smp->dr_slid),
 736		     send_wr->wr.ud.pkey_index,
 737		     send_wr->wr.ud.port_num, &mad_wc);






 738
 739	/* No GRH for DR SMP */
 740	ret = device->process_mad(device, 0, port_num, &mad_wc, NULL,
 741				  (struct ib_mad *)smp,
 742				  (struct ib_mad *)&mad_priv->mad);
	/*
	 * Every case either attaches mad_priv to the local entry or frees it.
	 * When it is freed, local->mad_priv keeps the NULL set above and the
	 * entry is still queued below with only mad_send_wr filled in.
	 */
 743	switch (ret)
 744	{
 745	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_REPLY:
		/*
		 * A reply was produced: hand it back to the sending agent
		 * only if it is a response MAD and the agent can receive.
		 */
 746		if (ib_response_mad(&mad_priv->mad.mad) &&
 747		    mad_agent_priv->agent.recv_handler) {
 748			local->mad_priv = mad_priv;
 749			local->recv_mad_agent = mad_agent_priv;
 750			/*
 751			 * Reference MAD agent until receive
 752			 * side of local completion handled
 753			 */
 754			atomic_inc(&mad_agent_priv->refcount);
 755		} else
 756			kmem_cache_free(ib_mad_cache, mad_priv);
 757		break;
 758	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_CONSUMED:
 759		kmem_cache_free(ib_mad_cache, mad_priv);
 760		break;
 761	case IB_MAD_RESULT_SUCCESS:
 762		/* Treat like an incoming receive MAD */
 763		port_priv = ib_get_mad_port(mad_agent_priv->agent.device,
 764					    mad_agent_priv->agent.port_num);
 765		if (port_priv) {
 766			memcpy(&mad_priv->mad.mad, smp, sizeof(struct ib_mad));
			/* find_mad_agent() returns the agent with a reference held. */
 767			recv_mad_agent = find_mad_agent(port_priv,
 768						        &mad_priv->mad.mad);
 769		}
 770		if (!port_priv || !recv_mad_agent) {
 771			/*
 772			 * No receiving agent so drop packet and
 773			 * generate send completion.
 774			 */
 775			kmem_cache_free(ib_mad_cache, mad_priv);
 776			break;
 777		}
 778		local->mad_priv = mad_priv;
 779		local->recv_mad_agent = recv_mad_agent;
 780		break;
 781	default:
		/* Any other result: release both allocations and fail. */
 782		kmem_cache_free(ib_mad_cache, mad_priv);
 783		kfree(local);
 784		ret = -EINVAL;
 785		goto out;
 786	}
 787
 788	local->mad_send_wr = mad_send_wr;




 789	/* Reference MAD agent until send side of local completion handled */
 790	atomic_inc(&mad_agent_priv->refcount);
 791	/* Queue local completion to local list */
 792	spin_lock_irqsave(&mad_agent_priv->lock, flags);
 793	list_add_tail(&local->completion_list, &mad_agent_priv->local_list);
 794	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
	/* The queued entry is picked up by the agent's local_work item. */
 795	queue_work(mad_agent_priv->qp_info->port_priv->wq,
 796		   &mad_agent_priv->local_work);
 797	ret = 1;
 798out:
 799	return ret;
 800}
 801
 802static int get_pad_size(int hdr_len, int data_len)
 803{
 804	int seg_size, pad;
 805
 806	seg_size = sizeof(struct ib_mad) - hdr_len;
 807	if (data_len && seg_size) {
 808		pad = seg_size - data_len % seg_size;
 809		return pad == seg_size ? 0 : pad;
 810	} else
 811		return seg_size;
 812}
 813
 814static void free_send_rmpp_list(struct ib_mad_send_wr_private *mad_send_wr)
 815{
 816	struct ib_rmpp_segment *s, *t;
 817
 818	list_for_each_entry_safe(s, t, &mad_send_wr->rmpp_list, list) {
 819		list_del(&s->list);
 820		kfree(s);
 821	}
 822}
 823
 824static int alloc_send_rmpp_list(struct ib_mad_send_wr_private *send_wr,
 825				gfp_t gfp_mask)
 826{
 827	struct ib_mad_send_buf *send_buf = &send_wr->send_buf;
 828	struct ib_rmpp_mad *rmpp_mad = send_buf->mad;
 829	struct ib_rmpp_segment *seg = NULL;
 830	int left, seg_size, pad;
 831
 832	send_buf->seg_size = sizeof (struct ib_mad) - send_buf->hdr_len;
 
 833	seg_size = send_buf->seg_size;
 834	pad = send_wr->pad;
 835
 836	/* Allocate data segments. */
 837	for (left = send_buf->data_len + pad; left > 0; left -= seg_size) {
 838		seg = kmalloc(sizeof (*seg) + seg_size, gfp_mask);
 839		if (!seg) {
 840			printk(KERN_ERR "alloc_send_rmpp_segs: RMPP mem "
 841			       "alloc failed for len %zd, gfp %#x\n",
 842			       sizeof (*seg) + seg_size, gfp_mask);
 843			free_send_rmpp_list(send_wr);
 844			return -ENOMEM;
 845		}
 846		seg->num = ++send_buf->seg_count;
 847		list_add_tail(&seg->list, &send_wr->rmpp_list);
 848	}
 849
 850	/* Zero any padding */
 851	if (pad)
 852		memset(seg->data + seg_size - pad, 0, pad);
 853
 854	rmpp_mad->rmpp_hdr.rmpp_version = send_wr->mad_agent_priv->
 855					  agent.rmpp_version;
 856	rmpp_mad->rmpp_hdr.rmpp_type = IB_MGMT_RMPP_TYPE_DATA;
 857	ib_set_rmpp_flags(&rmpp_mad->rmpp_hdr, IB_MGMT_RMPP_FLAG_ACTIVE);
 858
 859	send_wr->cur_seg = container_of(send_wr->rmpp_list.next,
 860					struct ib_rmpp_segment, list);
 861	send_wr->last_ack_seg = send_wr->cur_seg;
 862	return 0;
 863}
 864
 865struct ib_mad_send_buf * ib_create_send_mad(struct ib_mad_agent *mad_agent,
 866					    u32 remote_qpn, u16 pkey_index,
 867					    int rmpp_active,
 868					    int hdr_len, int data_len,
 869					    gfp_t gfp_mask)
 
 
 
 
 
 
 870{
 871	struct ib_mad_agent_private *mad_agent_priv;
 872	struct ib_mad_send_wr_private *mad_send_wr;
 873	int pad, message_size, ret, size;
 874	void *buf;
 
 
 875
 876	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
 877				      agent);
 878	pad = get_pad_size(hdr_len, data_len);
 
 
 
 
 
 
 
 
 879	message_size = hdr_len + data_len + pad;
 880
 881	if ((!mad_agent->rmpp_version &&
 882	     (rmpp_active || message_size > sizeof(struct ib_mad))) ||
 883	    (!rmpp_active && message_size > sizeof(struct ib_mad)))
 884		return ERR_PTR(-EINVAL);
 
 
 885
 886	size = rmpp_active ? hdr_len : sizeof(struct ib_mad);
 887	buf = kzalloc(sizeof *mad_send_wr + size, gfp_mask);
 888	if (!buf)
 889		return ERR_PTR(-ENOMEM);
 890
 891	mad_send_wr = buf + size;
 892	INIT_LIST_HEAD(&mad_send_wr->rmpp_list);
 893	mad_send_wr->send_buf.mad = buf;
 894	mad_send_wr->send_buf.hdr_len = hdr_len;
 895	mad_send_wr->send_buf.data_len = data_len;
 896	mad_send_wr->pad = pad;
 897
 898	mad_send_wr->mad_agent_priv = mad_agent_priv;
 899	mad_send_wr->sg_list[0].length = hdr_len;
 900	mad_send_wr->sg_list[0].lkey = mad_agent->mr->lkey;
 901	mad_send_wr->sg_list[1].length = sizeof(struct ib_mad) - hdr_len;
 902	mad_send_wr->sg_list[1].lkey = mad_agent->mr->lkey;
 903
 904	mad_send_wr->send_wr.wr_id = (unsigned long) mad_send_wr;
 905	mad_send_wr->send_wr.sg_list = mad_send_wr->sg_list;
 906	mad_send_wr->send_wr.num_sge = 2;
 907	mad_send_wr->send_wr.opcode = IB_WR_SEND;
 908	mad_send_wr->send_wr.send_flags = IB_SEND_SIGNALED;
 909	mad_send_wr->send_wr.wr.ud.remote_qpn = remote_qpn;
 910	mad_send_wr->send_wr.wr.ud.remote_qkey = IB_QP_SET_QKEY;
 911	mad_send_wr->send_wr.wr.ud.pkey_index = pkey_index;
 
 
 
 
 
 
 
 
 
 912
 913	if (rmpp_active) {
 914		ret = alloc_send_rmpp_list(mad_send_wr, gfp_mask);
 915		if (ret) {
 916			kfree(buf);
 917			return ERR_PTR(ret);
 918		}
 919	}
 920
 921	mad_send_wr->send_buf.mad_agent = mad_agent;
 922	atomic_inc(&mad_agent_priv->refcount);
 923	return &mad_send_wr->send_buf;
 924}
 925EXPORT_SYMBOL(ib_create_send_mad);
 926
 927int ib_get_mad_data_offset(u8 mgmt_class)
 928{
 929	if (mgmt_class == IB_MGMT_CLASS_SUBN_ADM)
 930		return IB_MGMT_SA_HDR;
 931	else if ((mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
 932		 (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
 933		 (mgmt_class == IB_MGMT_CLASS_BIS))
 934		return IB_MGMT_DEVICE_HDR;
 935	else if ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
 936		 (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END))
 937		return IB_MGMT_VENDOR_HDR;
 938	else
 939		return IB_MGMT_MAD_HDR;
 940}
 941EXPORT_SYMBOL(ib_get_mad_data_offset);
 942
 943int ib_is_mad_class_rmpp(u8 mgmt_class)
 944{
 945	if ((mgmt_class == IB_MGMT_CLASS_SUBN_ADM) ||
 946	    (mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
 947	    (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
 948	    (mgmt_class == IB_MGMT_CLASS_BIS) ||
 949	    ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
 950	     (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END)))
 951		return 1;
 952	return 0;
 953}
 954EXPORT_SYMBOL(ib_is_mad_class_rmpp);
 955
/*
 * ib_get_rmpp_segment - Return the data area of RMPP segment seg_num
 *
 * The search starts at the send WR's cached cur_seg and walks forwards or
 * backwards through the segment list depending on whether the cached
 * segment number is below or above seg_num.
 */
 956void *ib_get_rmpp_segment(struct ib_mad_send_buf *send_buf, int seg_num)
 957{
 958	struct ib_mad_send_wr_private *mad_send_wr;
 959	struct list_head *list;
 960
 961	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
 962				   send_buf);
	/* Remember where the cached segment sits before the cursor moves. */
 963	list = &mad_send_wr->cur_seg->list;
 964
	/*
	 * cur_seg itself is the loop cursor, so whichever segment the walk
	 * stops on becomes the new cached position.
	 * NOTE(review): if no segment numbered seg_num exists, the cursor is
	 * not restored afterwards - presumably callers only pass valid
	 * segment numbers; confirm against callers.
	 */
 965	if (mad_send_wr->cur_seg->num < seg_num) {
 966		list_for_each_entry(mad_send_wr->cur_seg, list, list)
 967			if (mad_send_wr->cur_seg->num == seg_num)
 968				break;
 969	} else if (mad_send_wr->cur_seg->num > seg_num) {
 970		list_for_each_entry_reverse(mad_send_wr->cur_seg, list, list)
 971			if (mad_send_wr->cur_seg->num == seg_num)
 972				break;
 973	}
 974	return mad_send_wr->cur_seg->data;
 975}
 976EXPORT_SYMBOL(ib_get_rmpp_segment);
 977
 978static inline void *ib_get_payload(struct ib_mad_send_wr_private *mad_send_wr)
 979{
 980	if (mad_send_wr->send_buf.seg_count)
 981		return ib_get_rmpp_segment(&mad_send_wr->send_buf,
 982					   mad_send_wr->seg_num);
 983	else
 984		return mad_send_wr->send_buf.mad +
 985		       mad_send_wr->send_buf.hdr_len;
 986}
 987
 988void ib_free_send_mad(struct ib_mad_send_buf *send_buf)
 989{
 990	struct ib_mad_agent_private *mad_agent_priv;
 991	struct ib_mad_send_wr_private *mad_send_wr;
 992
 993	mad_agent_priv = container_of(send_buf->mad_agent,
 994				      struct ib_mad_agent_private, agent);
 995	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
 996				   send_buf);
 997
 998	free_send_rmpp_list(mad_send_wr);
 999	kfree(send_buf->mad);
1000	deref_mad_agent(mad_agent_priv);
1001}
1002EXPORT_SYMBOL(ib_free_send_mad);
1003
1004int ib_send_mad(struct ib_mad_send_wr_private *mad_send_wr)
1005{
1006	struct ib_mad_qp_info *qp_info;
1007	struct list_head *list;
1008	struct ib_send_wr *bad_send_wr;
1009	struct ib_mad_agent *mad_agent;
1010	struct ib_sge *sge;
1011	unsigned long flags;
1012	int ret;
1013
1014	/* Set WR ID to find mad_send_wr upon completion */
1015	qp_info = mad_send_wr->mad_agent_priv->qp_info;
1016	mad_send_wr->send_wr.wr_id = (unsigned long)&mad_send_wr->mad_list;
1017	mad_send_wr->mad_list.mad_queue = &qp_info->send_queue;
 
 
1018
1019	mad_agent = mad_send_wr->send_buf.mad_agent;
1020	sge = mad_send_wr->sg_list;
1021	sge[0].addr = ib_dma_map_single(mad_agent->device,
1022					mad_send_wr->send_buf.mad,
1023					sge[0].length,
1024					DMA_TO_DEVICE);
 
 
 
1025	mad_send_wr->header_mapping = sge[0].addr;
1026
1027	sge[1].addr = ib_dma_map_single(mad_agent->device,
1028					ib_get_payload(mad_send_wr),
1029					sge[1].length,
1030					DMA_TO_DEVICE);
 
 
 
 
 
 
1031	mad_send_wr->payload_mapping = sge[1].addr;
1032
1033	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
1034	if (qp_info->send_queue.count < qp_info->send_queue.max_active) {
1035		ret = ib_post_send(mad_agent->qp, &mad_send_wr->send_wr,
1036				   &bad_send_wr);
 
1037		list = &qp_info->send_queue.list;
1038	} else {
1039		ret = 0;
1040		list = &qp_info->overflow_list;
1041	}
1042
1043	if (!ret) {
1044		qp_info->send_queue.count++;
1045		list_add_tail(&mad_send_wr->mad_list.list, list);
1046	}
1047	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
1048	if (ret) {
1049		ib_dma_unmap_single(mad_agent->device,
1050				    mad_send_wr->header_mapping,
1051				    sge[0].length, DMA_TO_DEVICE);
1052		ib_dma_unmap_single(mad_agent->device,
1053				    mad_send_wr->payload_mapping,
1054				    sge[1].length, DMA_TO_DEVICE);
1055	}
1056	return ret;
1057}
1058
1059/*
1060 * ib_post_send_mad - Posts MAD(s) to the send queue of the QP associated
1061 *  with the registered client
1062 */
/*
 * Walks the chain linked through send_buf->next.  Returns 0 when every
 * buffer was accepted.  On the first failure it returns a negative errno and,
 * if bad_send_buf is non-NULL, stores the failing buffer there; buffers
 * earlier in the chain have already been handed off at that point.
 */
1063int ib_post_send_mad(struct ib_mad_send_buf *send_buf,
1064		     struct ib_mad_send_buf **bad_send_buf)
1065{
1066	struct ib_mad_agent_private *mad_agent_priv;
1067	struct ib_mad_send_buf *next_send_buf;
1068	struct ib_mad_send_wr_private *mad_send_wr;
1069	unsigned long flags;
1070	int ret = -EINVAL;
1071
1072	/* Walk list of send WRs and post each on send list */
1073	for (; send_buf; send_buf = next_send_buf) {
1074
1075		mad_send_wr = container_of(send_buf,
1076					   struct ib_mad_send_wr_private,
1077					   send_buf);
1078		mad_agent_priv = mad_send_wr->mad_agent_priv;
1079





		/*
		 * A send handler is mandatory; a non-zero timeout_ms
		 * additionally requires a receive handler.
		 */
1080		if (!send_buf->mad_agent->send_handler ||
1081		    (send_buf->timeout_ms &&
1082		     !send_buf->mad_agent->recv_handler)) {
1083			ret = -EINVAL;
1084			goto error;
1085		}
1086
		/*
		 * A MAD of a non-RMPP class is rejected when the agent was
		 * registered with an RMPP version.
		 */
1087		if (!ib_is_mad_class_rmpp(((struct ib_mad_hdr *) send_buf->mad)->mgmt_class)) {
1088			if (mad_agent_priv->agent.rmpp_version) {
1089				ret = -EINVAL;
1090				goto error;
1091			}
1092		}
1093
1094		/*
1095		 * Save pointer to next work request to post in case the
1096		 * current one completes, and the user modifies the work
1097		 * request associated with the completion
1098		 */
1099		next_send_buf = send_buf->next;
1100		mad_send_wr->send_wr.wr.ud.ah = send_buf->ah;
1101
		/*
		 * Directed-route SMPs may be completed locally; a return of 0
		 * means the SMP still has to go out through the QP below.
		 */
1102		if (((struct ib_mad_hdr *) send_buf->mad)->mgmt_class ==
1103		    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
1104			ret = handle_outgoing_dr_smp(mad_agent_priv,
1105						     mad_send_wr);
1106			if (ret < 0)		/* error */
1107				goto error;
1108			else if (ret == 1)	/* locally consumed */
1109				continue;
1110		}
1111
1112		mad_send_wr->tid = ((struct ib_mad_hdr *) send_buf->mad)->tid;
1113		/* Timeout will be updated after send completes */
1114		mad_send_wr->timeout = msecs_to_jiffies(send_buf->timeout_ms);
1115		mad_send_wr->max_retries = send_buf->retries;
1116		mad_send_wr->retries_left = send_buf->retries;
		/*
		 * NOTE(review): the retry count now lives in the private WR
		 * and the caller-visible field is cleared; the reason is not
		 * evident from this function - confirm against the
		 * completion path.
		 */
1117		send_buf->retries = 0;
1118		/* Reference for work request to QP + response */
1119		mad_send_wr->refcount = 1 + (mad_send_wr->timeout > 0);
1120		mad_send_wr->status = IB_WC_SUCCESS;
1121
1122		/* Reference MAD agent until send completes */
1123		atomic_inc(&mad_agent_priv->refcount);
1124		spin_lock_irqsave(&mad_agent_priv->lock, flags);
1125		list_add_tail(&mad_send_wr->agent_list,
1126			      &mad_agent_priv->send_list);
1127		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1128
		/*
		 * With RMPP the MAD goes through ib_send_rmpp_mad() first and
		 * is only passed on to ib_send_mad() when that call neither
		 * failed nor consumed it.
		 */
1129		if (mad_agent_priv->agent.rmpp_version) {
1130			ret = ib_send_rmpp_mad(mad_send_wr);
1131			if (ret >= 0 && ret != IB_RMPP_RESULT_CONSUMED)
1132				ret = ib_send_mad(mad_send_wr);
1133		} else
1134			ret = ib_send_mad(mad_send_wr);
1135		if (ret < 0) {
1136			/* Fail send request */
			/* Undo the send_list insertion and agent reference. */
1137			spin_lock_irqsave(&mad_agent_priv->lock, flags);
1138			list_del(&mad_send_wr->agent_list);
1139			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1140			atomic_dec(&mad_agent_priv->refcount);
1141			goto error;
1142		}
1143	}
1144	return 0;
1145error:
1146	if (bad_send_buf)
1147		*bad_send_buf = send_buf;
1148	return ret;
1149}
1150EXPORT_SYMBOL(ib_post_send_mad);
1151
1152/*
1153 * ib_free_recv_mad - Returns data buffers used to receive
1154 *  a MAD to the access layer
1155 */
1156void ib_free_recv_mad(struct ib_mad_recv_wc *mad_recv_wc)
1157{
1158	struct ib_mad_recv_buf *mad_recv_buf, *temp_recv_buf;
1159	struct ib_mad_private_header *mad_priv_hdr;
1160	struct ib_mad_private *priv;
1161	struct list_head free_list;
1162
1163	INIT_LIST_HEAD(&free_list);
1164	list_splice_init(&mad_recv_wc->rmpp_list, &free_list);
1165
1166	list_for_each_entry_safe(mad_recv_buf, temp_recv_buf,
1167					&free_list, list) {
1168		mad_recv_wc = container_of(mad_recv_buf, struct ib_mad_recv_wc,
1169					   recv_buf);
1170		mad_priv_hdr = container_of(mad_recv_wc,
1171					    struct ib_mad_private_header,
1172					    recv_wc);
1173		priv = container_of(mad_priv_hdr, struct ib_mad_private,
1174				    header);
1175		kmem_cache_free(ib_mad_cache, priv);
1176	}
1177}
1178EXPORT_SYMBOL(ib_free_recv_mad);
1179
1180struct ib_mad_agent *ib_redirect_mad_qp(struct ib_qp *qp,
1181					u8 rmpp_version,
1182					ib_mad_send_handler send_handler,
1183					ib_mad_recv_handler recv_handler,
1184					void *context)
1185{
1186	return ERR_PTR(-EINVAL);	/* XXX: for now */
1187}
1188EXPORT_SYMBOL(ib_redirect_mad_qp);
1189
1190int ib_process_mad_wc(struct ib_mad_agent *mad_agent,
1191		      struct ib_wc *wc)
1192{
1193	printk(KERN_ERR PFX "ib_process_mad_wc() not implemented yet\n");
1194	return 0;
1195}
1196EXPORT_SYMBOL(ib_process_mad_wc);
1197
1198static int method_in_use(struct ib_mad_mgmt_method_table **method,
1199			 struct ib_mad_reg_req *mad_reg_req)
1200{
1201	int i;
1202
1203	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS) {
1204		if ((*method)->agent[i]) {
1205			printk(KERN_ERR PFX "Method %d already in use\n", i);
1206			return -EINVAL;
1207		}
1208	}
1209	return 0;
1210}
1211
1212static int allocate_method_table(struct ib_mad_mgmt_method_table **method)
1213{
1214	/* Allocate management method table */
1215	*method = kzalloc(sizeof **method, GFP_ATOMIC);
1216	if (!*method) {
1217		printk(KERN_ERR PFX "No memory for "
1218		       "ib_mad_mgmt_method_table\n");
1219		return -ENOMEM;
1220	}
1221
1222	return 0;
1223}
1224
1225/*
1226 * Check to see if there are any methods still in use
1227 */
1228static int check_method_table(struct ib_mad_mgmt_method_table *method)
1229{
1230	int i;
1231
1232	for (i = 0; i < IB_MGMT_MAX_METHODS; i++)
1233		if (method->agent[i])
1234			return 1;
1235	return 0;
1236}
1237
1238/*
1239 * Check to see if there are any method tables for this class still in use
1240 */
1241static int check_class_table(struct ib_mad_mgmt_class_table *class)
1242{
1243	int i;
1244
1245	for (i = 0; i < MAX_MGMT_CLASS; i++)
1246		if (class->method_table[i])
1247			return 1;
1248	return 0;
1249}
1250
1251static int check_vendor_class(struct ib_mad_mgmt_vendor_class *vendor_class)
1252{
1253	int i;
1254
1255	for (i = 0; i < MAX_MGMT_OUI; i++)
1256		if (vendor_class->method_table[i])
1257			return 1;
1258	return 0;
1259}
1260
1261static int find_vendor_oui(struct ib_mad_mgmt_vendor_class *vendor_class,
1262			   char *oui)
1263{
1264	int i;
1265
1266	for (i = 0; i < MAX_MGMT_OUI; i++)
1267		/* Is there matching OUI for this vendor class ? */
1268		if (!memcmp(vendor_class->oui[i], oui, 3))
1269			return i;
1270
1271	return -1;
1272}
1273
1274static int check_vendor_table(struct ib_mad_mgmt_vendor_class_table *vendor)
1275{
1276	int i;
1277
1278	for (i = 0; i < MAX_MGMT_VENDOR_RANGE2; i++)
1279		if (vendor->vendor_class[i])
1280			return 1;
1281
1282	return 0;
1283}
1284
1285static void remove_methods_mad_agent(struct ib_mad_mgmt_method_table *method,
1286				     struct ib_mad_agent_private *agent)
1287{
1288	int i;
1289
1290	/* Remove any methods for this mad agent */
1291	for (i = 0; i < IB_MGMT_MAX_METHODS; i++) {
1292		if (method->agent[i] == agent) {
1293			method->agent[i] = NULL;
1294		}
1295	}
1296}
1297
/*
 * add_nonoui_reg_req - Register an agent for the methods of a class that is
 * looked up by class version and management class only
 *
 * Allocates the per-version class table and the per-class method table on
 * demand, then claims every method set in mad_reg_req->method_mask for
 * agent_priv.  Returns 0 on success, -ENOMEM when a table cannot be
 * allocated, or -EINVAL when a requested method already has an agent.
 */
1298static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1299			      struct ib_mad_agent_private *agent_priv,
1300			      u8 mgmt_class)
1301{
1302	struct ib_mad_port_private *port_priv;
1303	struct ib_mad_mgmt_class_table **class;
1304	struct ib_mad_mgmt_method_table **method;
1305	int i, ret;
1306
1307	port_priv = agent_priv->qp_info->port_priv;
1308	class = &port_priv->version[mad_reg_req->mgmt_class_version].class;
1309	if (!*class) {
1310		/* Allocate management class table for "new" class version */
1311		*class = kzalloc(sizeof **class, GFP_ATOMIC);
1312		if (!*class) {
1313			printk(KERN_ERR PFX "No memory for "
1314			       "ib_mad_mgmt_class_table\n");
1315			ret = -ENOMEM;
1316			goto error1;
1317		}
1318
1319		/* Allocate method table for this management class */
1320		method = &(*class)->method_table[mgmt_class];
		/* On failure the class table allocated just above is freed. */
1321		if ((ret = allocate_method_table(method)))
1322			goto error2;
1323	} else {
1324		method = &(*class)->method_table[mgmt_class];
1325		if (!*method) {
1326			/* Allocate method table for this management class */
			/* The class table already existed, so it is kept. */
1327			if ((ret = allocate_method_table(method)))
1328				goto error1;
1329		}
1330	}
1331
1332	/* Now, make sure methods are not already in use */
1333	if (method_in_use(method, mad_reg_req))
1334		goto error3;
1335
1336	/* Finally, add in methods being registered */
1337	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
1338		(*method)->agent[i] = agent_priv;
1339
1340	return 0;
1341
1342error3:
1343	/* Remove any methods for this mad agent */
1344	remove_methods_mad_agent(*method, agent_priv);
1345	/* Now, check to see if there are any methods in use */
1346	if (!check_method_table(*method)) {
1347		/* If not, release management method table */
1348		kfree(*method);
1349		*method = NULL;
1350	}
1351	ret = -EINVAL;
1352	goto error1;
1353error2:
1354	kfree(*class);
1355	*class = NULL;
1356error1:
1357	return ret;
1358}
1359
/*
 * add_oui_reg_req - Register an agent for the methods of a vendor class that
 * is additionally keyed by OUI
 *
 * Allocates the vendor table, the vendor class and the per-OUI method table
 * on demand, then claims every method set in mad_reg_req->method_mask for
 * agent_priv.  Returns 0 on success, -EINVAL when a requested method already
 * has an agent, and -ENOMEM when an allocation fails.  Running out of OUI
 * slots also returns -ENOMEM, because ret still holds its initial value on
 * that path.
 */
1360static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1361			   struct ib_mad_agent_private *agent_priv)
1362{
1363	struct ib_mad_port_private *port_priv;
1364	struct ib_mad_mgmt_vendor_class_table **vendor_table;
	/*
	 * vendor and vendor_class stay NULL unless this call allocates them;
	 * the error labels use that to free only what was created here.
	 */
1365	struct ib_mad_mgmt_vendor_class_table *vendor = NULL;
1366	struct ib_mad_mgmt_vendor_class *vendor_class = NULL;
1367	struct ib_mad_mgmt_method_table **method;
1368	int i, ret = -ENOMEM;
1369	u8 vclass;
1370
1371	/* "New" vendor (with OUI) class */
1372	vclass = vendor_class_index(mad_reg_req->mgmt_class);
1373	port_priv = agent_priv->qp_info->port_priv;
1374	vendor_table = &port_priv->version[
1375				mad_reg_req->mgmt_class_version].vendor;
1376	if (!*vendor_table) {
1377		/* Allocate mgmt vendor class table for "new" class version */
1378		vendor = kzalloc(sizeof *vendor, GFP_ATOMIC);
1379		if (!vendor) {
1380			printk(KERN_ERR PFX "No memory for "
1381			       "ib_mad_mgmt_vendor_class_table\n");
1382			goto error1;
1383		}
1384
1385		*vendor_table = vendor;
1386	}
1387	if (!(*vendor_table)->vendor_class[vclass]) {
1388		/* Allocate table for this management vendor class */
1389		vendor_class = kzalloc(sizeof *vendor_class, GFP_ATOMIC);
1390		if (!vendor_class) {
1391			printk(KERN_ERR PFX "No memory for "
1392			       "ib_mad_mgmt_vendor_class\n");
1393			goto error2;
1394		}
1395
1396		(*vendor_table)->vendor_class[vclass] = vendor_class;
1397	}
	/* First pass: reuse the slot that already holds this OUI. */
1398	for (i = 0; i < MAX_MGMT_OUI; i++) {
1399		/* Is there matching OUI for this vendor class ? */
1400		if (!memcmp((*vendor_table)->vendor_class[vclass]->oui[i],
1401			    mad_reg_req->oui, 3)) {
1402			method = &(*vendor_table)->vendor_class[
1403						vclass]->method_table[i];
1404			BUG_ON(!*method);

1405			goto check_in_use;
1406		}
1407	}
	/* Second pass: claim the first slot that holds no vendor OUI. */
1408	for (i = 0; i < MAX_MGMT_OUI; i++) {
1409		/* OUI slot available ? */
1410		if (!is_vendor_oui((*vendor_table)->vendor_class[
1411				vclass]->oui[i])) {
1412			method = &(*vendor_table)->vendor_class[
1413				vclass]->method_table[i];
1414			BUG_ON(*method);
1415			/* Allocate method table for this OUI */
1416			if ((ret = allocate_method_table(method)))
1417				goto error3;



1418			memcpy((*vendor_table)->vendor_class[vclass]->oui[i],
1419			       mad_reg_req->oui, 3);
1420			goto check_in_use;
1421		}
1422	}
1423	printk(KERN_ERR PFX "All OUI slots in use\n");
1424	goto error3;
1425
1426check_in_use:
1427	/* Now, make sure methods are not already in use */
1428	if (method_in_use(method, mad_reg_req))
1429		goto error4;
1430
1431	/* Finally, add in methods being registered */
1432	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
1433		(*method)->agent[i] = agent_priv;
1434
1435	return 0;
1436
	/* The labels below fall through, unwinding in reverse order. */
1437error4:
1438	/* Remove any methods for this mad agent */
1439	remove_methods_mad_agent(*method, agent_priv);
1440	/* Now, check to see if there are any methods in use */
1441	if (!check_method_table(*method)) {
1442		/* If not, release management method table */
1443		kfree(*method);
1444		*method = NULL;
1445	}
1446	ret = -EINVAL;
1447error3:
1448	if (vendor_class) {
1449		(*vendor_table)->vendor_class[vclass] = NULL;
1450		kfree(vendor_class);
1451	}
1452error2:
1453	if (vendor) {
1454		*vendor_table = NULL;
1455		kfree(vendor);
1456	}
1457error1:
1458	return ret;
1459}
1460
/*
 * remove_mad_reg_req - Undo the table entries made for an agent's
 * registration request
 *
 * Clears the agent from the method table of its class and, for vendor
 * classes, from the method table of its OUI.  Each table that ends up empty
 * is freed, and so is each enclosing table that becomes empty as a result.
 * Does nothing for an agent without a registration request.
 */
1461static void remove_mad_reg_req(struct ib_mad_agent_private *agent_priv)
1462{
1463	struct ib_mad_port_private *port_priv;
1464	struct ib_mad_mgmt_class_table *class;
1465	struct ib_mad_mgmt_method_table *method;
1466	struct ib_mad_mgmt_vendor_class_table *vendor;
1467	struct ib_mad_mgmt_vendor_class *vendor_class;
1468	int index;
1469	u8 mgmt_class;
1470
1471	/*
1472	 * Was MAD registration request supplied
1473	 * with original registration ?
1474	 */
1475	if (!agent_priv->reg_req) {
1476		goto out;
1477	}
1478
1479	port_priv = agent_priv->qp_info->port_priv;
1480	mgmt_class = convert_mgmt_class(agent_priv->reg_req->mgmt_class);
1481	class = port_priv->version[
1482			agent_priv->reg_req->mgmt_class_version].class;
1483	if (!class)
1484		goto vendor_check;
1485
1486	method = class->method_table[mgmt_class];
1487	if (method) {
1488		/* Remove any methods for this mad agent */
1489		remove_methods_mad_agent(method, agent_priv);
1490		/* Now, check to see if there are any methods still in use */
1491		if (!check_method_table(method)) {
1492			/* If not, release management method table */
1493			 kfree(method);
1494			 class->method_table[mgmt_class] = NULL;
1495			 /* Any management classes left ? */
1496			if (!check_class_table(class)) {
1497				/* If not, release management class table */
1498				kfree(class);
1499				port_priv->version[
1500					agent_priv->reg_req->
1501					mgmt_class_version].class = NULL;
1502			}
1503		}
1504	}
1505
1506vendor_check:
	/* Only vendor classes have entries in the OUI-keyed tables. */
1507	if (!is_vendor_class(mgmt_class))
1508		goto out;
1509
1510	/* normalize mgmt_class to vendor range 2 */
1511	mgmt_class = vendor_class_index(agent_priv->reg_req->mgmt_class);
1512	vendor = port_priv->version[
1513			agent_priv->reg_req->mgmt_class_version].vendor;
1514
1515	if (!vendor)
1516		goto out;
1517
1518	vendor_class = vendor->vendor_class[mgmt_class];
1519	if (vendor_class) {
1520		index = find_vendor_oui(vendor_class, agent_priv->reg_req->oui);
1521		if (index < 0)
1522			goto out;
1523		method = vendor_class->method_table[index];
1524		if (method) {
1525			/* Remove any methods for this mad agent */
1526			remove_methods_mad_agent(method, agent_priv);
1527			/*
1528			 * Now, check to see if there are
1529			 * any methods still in use
1530			 */
1531			if (!check_method_table(method)) {
1532				/* If not, release management method table */
1533				kfree(method);
1534				vendor_class->method_table[index] = NULL;
				/* Zero the OUI bytes of the released slot. */
1535				memset(vendor_class->oui[index], 0, 3);
1536				/* Any OUIs left ? */
1537				if (!check_vendor_class(vendor_class)) {
1538					/* If not, release vendor class table */
1539					kfree(vendor_class);
1540					vendor->vendor_class[mgmt_class] = NULL;
1541					/* Any other vendor classes left ? */
1542					if (!check_vendor_table(vendor)) {
1543						kfree(vendor);
1544						port_priv->version[
1545							agent_priv->reg_req->
1546							mgmt_class_version].
1547							vendor = NULL;
1548					}
1549				}
1550			}
1551		}
1552	}
1553
1554out:
1555	return;
1556}
1557
1558static struct ib_mad_agent_private *
1559find_mad_agent(struct ib_mad_port_private *port_priv,
1560	       struct ib_mad *mad)
1561{
1562	struct ib_mad_agent_private *mad_agent = NULL;
1563	unsigned long flags;
1564
1565	spin_lock_irqsave(&port_priv->reg_lock, flags);
1566	if (ib_response_mad(mad)) {
1567		u32 hi_tid;
1568		struct ib_mad_agent_private *entry;
1569
1570		/*
1571		 * Routing is based on high 32 bits of transaction ID
1572		 * of MAD.
1573		 */
1574		hi_tid = be64_to_cpu(mad->mad_hdr.tid) >> 32;
1575		list_for_each_entry(entry, &port_priv->agent_list, agent_list) {
1576			if (entry->agent.hi_tid == hi_tid) {
1577				mad_agent = entry;
1578				break;
1579			}
1580		}
1581	} else {
1582		struct ib_mad_mgmt_class_table *class;
1583		struct ib_mad_mgmt_method_table *method;
1584		struct ib_mad_mgmt_vendor_class_table *vendor;
1585		struct ib_mad_mgmt_vendor_class *vendor_class;
1586		struct ib_vendor_mad *vendor_mad;
1587		int index;
1588
 
1589		/*
1590		 * Routing is based on version, class, and method
1591		 * For "newer" vendor MADs, also based on OUI
1592		 */
1593		if (mad->mad_hdr.class_version >= MAX_MGMT_VERSION)
1594			goto out;
1595		if (!is_vendor_class(mad->mad_hdr.mgmt_class)) {
1596			class = port_priv->version[
1597					mad->mad_hdr.class_version].class;
1598			if (!class)
1599				goto out;
1600			if (convert_mgmt_class(mad->mad_hdr.mgmt_class) >=
1601			    IB_MGMT_MAX_METHODS)
1602				goto out;
1603			method = class->method_table[convert_mgmt_class(
1604							mad->mad_hdr.mgmt_class)];
1605			if (method)
1606				mad_agent = method->agent[mad->mad_hdr.method &
1607							  ~IB_MGMT_METHOD_RESP];
1608		} else {
1609			vendor = port_priv->version[
1610					mad->mad_hdr.class_version].vendor;
1611			if (!vendor)
1612				goto out;
1613			vendor_class = vendor->vendor_class[vendor_class_index(
1614						mad->mad_hdr.mgmt_class)];
1615			if (!vendor_class)
1616				goto out;
1617			/* Find matching OUI */
1618			vendor_mad = (struct ib_vendor_mad *)mad;
1619			index = find_vendor_oui(vendor_class, vendor_mad->oui);
1620			if (index == -1)
1621				goto out;
1622			method = vendor_class->method_table[index];
1623			if (method) {
1624				mad_agent = method->agent[mad->mad_hdr.method &
1625							  ~IB_MGMT_METHOD_RESP];
1626			}
1627		}
 
 
 
 
1628	}
1629
1630	if (mad_agent) {
1631		if (mad_agent->agent.recv_handler)
1632			atomic_inc(&mad_agent->refcount);
1633		else {
1634			printk(KERN_NOTICE PFX "No receive handler for client "
1635			       "%p on port %d\n",
1636			       &mad_agent->agent, port_priv->port_num);
1637			mad_agent = NULL;
1638		}
1639	}
1640out:
1641	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
1642
1643	return mad_agent;
1644}
1645
1646static int validate_mad(struct ib_mad *mad, u32 qp_num)
 
 
1647{
1648	int valid = 0;
 
1649
1650	/* Make sure MAD base version is understood */
1651	if (mad->mad_hdr.base_version != IB_MGMT_BASE_VERSION) {
1652		printk(KERN_ERR PFX "MAD received with unsupported base "
1653		       "version %d\n", mad->mad_hdr.base_version);
 
1654		goto out;
1655	}
1656
1657	/* Filter SMI packets sent to other than QP0 */
1658	if ((mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
1659	    (mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
1660		if (qp_num == 0)
1661			valid = 1;
1662	} else {
 
 
 
 
 
1663		/* Filter GSI packets sent to QP0 */
1664		if (qp_num != 0)
1665			valid = 1;
1666	}
1667
1668out:
1669	return valid;
1670}
1671
1672static int is_data_mad(struct ib_mad_agent_private *mad_agent_priv,
1673		       struct ib_mad_hdr *mad_hdr)
1674{
1675	struct ib_rmpp_mad *rmpp_mad;
1676
1677	rmpp_mad = (struct ib_rmpp_mad *)mad_hdr;
1678	return !mad_agent_priv->agent.rmpp_version ||
 
1679		!(ib_get_rmpp_flags(&rmpp_mad->rmpp_hdr) &
1680				    IB_MGMT_RMPP_FLAG_ACTIVE) ||
1681		(rmpp_mad->rmpp_hdr.rmpp_type == IB_MGMT_RMPP_TYPE_DATA);
1682}
1683
1684static inline int rcv_has_same_class(struct ib_mad_send_wr_private *wr,
1685				     struct ib_mad_recv_wc *rwc)
1686{
1687	return ((struct ib_mad *)(wr->send_buf.mad))->mad_hdr.mgmt_class ==
1688		rwc->recv_buf.mad->mad_hdr.mgmt_class;
1689}
1690
1691static inline int rcv_has_same_gid(struct ib_mad_agent_private *mad_agent_priv,
1692				   struct ib_mad_send_wr_private *wr,
1693				   struct ib_mad_recv_wc *rwc )
 
1694{
1695	struct ib_ah_attr attr;
1696	u8 send_resp, rcv_resp;
1697	union ib_gid sgid;
1698	struct ib_device *device = mad_agent_priv->agent.device;
1699	u8 port_num = mad_agent_priv->agent.port_num;
1700	u8 lmc;
 
1701
1702	send_resp = ib_response_mad((struct ib_mad *)wr->send_buf.mad);
1703	rcv_resp = ib_response_mad(rwc->recv_buf.mad);
1704
1705	if (send_resp == rcv_resp)
1706		/* both requests, or both responses. GIDs different */
1707		return 0;
1708
1709	if (ib_query_ah(wr->send_buf.ah, &attr))
1710		/* Assume not equal, to avoid false positives. */
1711		return 0;
1712
1713	if (!!(attr.ah_flags & IB_AH_GRH) !=
1714	    !!(rwc->wc->wc_flags & IB_WC_GRH))
1715		/* one has GID, other does not.  Assume different */
1716		return 0;
1717
1718	if (!send_resp && rcv_resp) {
1719		/* is request/response. */
1720		if (!(attr.ah_flags & IB_AH_GRH)) {
1721			if (ib_get_cached_lmc(device, port_num, &lmc))
1722				return 0;
1723			return (!lmc || !((attr.src_path_bits ^
1724					   rwc->wc->dlid_path_bits) &
1725					  ((1 << lmc) - 1)));
1726		} else {
1727			if (ib_get_cached_gid(device, port_num,
1728					      attr.grh.sgid_index, &sgid))
 
 
 
1729				return 0;
1730			return !memcmp(sgid.raw, rwc->recv_buf.grh->dgid.raw,
1731				       16);
1732		}
1733	}
1734
1735	if (!(attr.ah_flags & IB_AH_GRH))
1736		return attr.dlid == rwc->wc->slid;
1737	else
1738		return !memcmp(attr.grh.dgid.raw, rwc->recv_buf.grh->sgid.raw,
 
1739			       16);
1740}
1741
1742static inline int is_direct(u8 class)
1743{
1744	return (class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE);
1745}
1746
1747struct ib_mad_send_wr_private*
1748ib_find_send_mad(struct ib_mad_agent_private *mad_agent_priv,
1749		 struct ib_mad_recv_wc *wc)
1750{
1751	struct ib_mad_send_wr_private *wr;
1752	struct ib_mad *mad;
1753
1754	mad = (struct ib_mad *)wc->recv_buf.mad;
1755
1756	list_for_each_entry(wr, &mad_agent_priv->wait_list, agent_list) {
1757		if ((wr->tid == mad->mad_hdr.tid) &&
1758		    rcv_has_same_class(wr, wc) &&
1759		    /*
1760		     * Don't check GID for direct routed MADs.
1761		     * These might have permissive LIDs.
1762		     */
1763		    (is_direct(wc->recv_buf.mad->mad_hdr.mgmt_class) ||
1764		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1765			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1766	}
1767
1768	/*
1769	 * It's possible to receive the response before we've
1770	 * been notified that the send has completed
1771	 */
1772	list_for_each_entry(wr, &mad_agent_priv->send_list, agent_list) {
1773		if (is_data_mad(mad_agent_priv, wr->send_buf.mad) &&
1774		    wr->tid == mad->mad_hdr.tid &&
1775		    wr->timeout &&
1776		    rcv_has_same_class(wr, wc) &&
1777		    /*
1778		     * Don't check GID for direct routed MADs.
1779		     * These might have permissive LIDs.
1780		     */
1781		    (is_direct(wc->recv_buf.mad->mad_hdr.mgmt_class) ||
1782		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1783			/* Verify request has not been canceled */
1784			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1785	}
1786	return NULL;
1787}
1788
1789void ib_mark_mad_done(struct ib_mad_send_wr_private *mad_send_wr)
1790{
1791	mad_send_wr->timeout = 0;
1792	if (mad_send_wr->refcount == 1)
1793		list_move_tail(&mad_send_wr->agent_list,
1794			      &mad_send_wr->mad_agent_priv->done_list);
1795}
1796
1797static void ib_mad_complete_recv(struct ib_mad_agent_private *mad_agent_priv,
1798				 struct ib_mad_recv_wc *mad_recv_wc)
1799{
1800	struct ib_mad_send_wr_private *mad_send_wr;
1801	struct ib_mad_send_wc mad_send_wc;
1802	unsigned long flags;
 
1803
1804	INIT_LIST_HEAD(&mad_recv_wc->rmpp_list);
 
 
 
 
 
 
 
 
1805	list_add(&mad_recv_wc->recv_buf.list, &mad_recv_wc->rmpp_list);
1806	if (mad_agent_priv->agent.rmpp_version) {
1807		mad_recv_wc = ib_process_rmpp_recv_wc(mad_agent_priv,
1808						      mad_recv_wc);
1809		if (!mad_recv_wc) {
1810			deref_mad_agent(mad_agent_priv);
1811			return;
1812		}
1813	}
1814
1815	/* Complete corresponding request */
1816	if (ib_response_mad(mad_recv_wc->recv_buf.mad)) {
1817		spin_lock_irqsave(&mad_agent_priv->lock, flags);
1818		mad_send_wr = ib_find_send_mad(mad_agent_priv, mad_recv_wc);
1819		if (!mad_send_wr) {
1820			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1821			ib_free_recv_mad(mad_recv_wc);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1822			deref_mad_agent(mad_agent_priv);
1823			return;
 
 
 
 
1824		}
1825		ib_mark_mad_done(mad_send_wr);
1826		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1827
1828		/* Defined behavior is to complete response before request */
1829		mad_recv_wc->wc->wr_id = (unsigned long) &mad_send_wr->send_buf;
1830		mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent,
1831						   mad_recv_wc);
1832		atomic_dec(&mad_agent_priv->refcount);
1833
1834		mad_send_wc.status = IB_WC_SUCCESS;
1835		mad_send_wc.vendor_err = 0;
1836		mad_send_wc.send_buf = &mad_send_wr->send_buf;
1837		ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
1838	} else {
1839		mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent,
1840						   mad_recv_wc);
1841		deref_mad_agent(mad_agent_priv);
1842	}
1843}
1844
1845static bool generate_unmatched_resp(struct ib_mad_private *recv,
1846				    struct ib_mad_private *response)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1847{
1848	if (recv->mad.mad.mad_hdr.method == IB_MGMT_METHOD_GET ||
1849	    recv->mad.mad.mad_hdr.method == IB_MGMT_METHOD_SET) {
1850		memcpy(response, recv, sizeof *response);
 
 
 
1851		response->header.recv_wc.wc = &response->header.wc;
1852		response->header.recv_wc.recv_buf.mad = &response->mad.mad;
1853		response->header.recv_wc.recv_buf.grh = &response->grh;
1854		response->mad.mad.mad_hdr.method = IB_MGMT_METHOD_GET_RESP;
1855		response->mad.mad.mad_hdr.status =
1856			cpu_to_be16(IB_MGMT_MAD_STATUS_UNSUPPORTED_METHOD_ATTRIB);
1857		if (recv->mad.mad.mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
1858			response->mad.mad.mad_hdr.status |= IB_SMP_DIRECTION;
 
 
 
 
 
 
 
 
 
 
1859
1860		return true;
1861	} else {
1862		return false;
1863	}
1864}
/*
 * Handle one receive work completion.
 *
 * The receive buffer is recovered from wc->wr_id, dequeued with
 * dequeue_mad() and DMA-unmapped.  The MAD is then passed to
 * snoop_recv() when the QP's snoop_count is non-zero, validated, run
 * through the directed-route SMI checks when its class is
 * IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE, offered to the device's
 * process_mad() hook if one is set, and finally dispatched to the agent
 * returned by find_mad_agent().  When no agent is found, a reply may be
 * produced by generate_unmatched_resp().
 *
 * Every path ends at "out", where a buffer is handed back to
 * ib_mad_post_receive_mads(): the response buffer if one was allocated
 * (any still-owned recv buffer is then freed), otherwise recv itself.
 */
static void ib_mad_recv_done_handler(struct ib_mad_port_private *port_priv,
				     struct ib_wc *wc)
{
	struct ib_mad_qp_info *qp_info;
	struct ib_mad_private_header *mad_priv_hdr;
	struct ib_mad_private *recv, *response = NULL;
	struct ib_mad_list_head *mad_list;
	struct ib_mad_agent_private *mad_agent;
	int port_num;
	int ret = IB_MAD_RESULT_SUCCESS;

	/* wr_id carries the address of the buffer's list head */
	mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
	qp_info = mad_list->mad_queue->qp_info;
	dequeue_mad(mad_list);

	/* Walk back from the list head to the enclosing private MAD */
	mad_priv_hdr = container_of(mad_list, struct ib_mad_private_header,
				    mad_list);
	recv = container_of(mad_priv_hdr, struct ib_mad_private, header);
	ib_dma_unmap_single(port_priv->device,
			    recv->header.mapping,
			    sizeof(struct ib_mad_private) -
			      sizeof(struct ib_mad_private_header),
			    DMA_FROM_DEVICE);

	/* Setup MAD receive work completion from "normal" work completion */
	recv->header.wc = *wc;
	recv->header.recv_wc.wc = &recv->header.wc;
	recv->header.recv_wc.mad_len = sizeof(struct ib_mad);
	recv->header.recv_wc.recv_buf.mad = &recv->mad.mad;
	recv->header.recv_wc.recv_buf.grh = &recv->grh;

	if (atomic_read(&qp_info->snoop_count))
		snoop_recv(qp_info, &recv->header.recv_wc, IB_MAD_SNOOP_RECVS);

	/* Validate MAD */
	if (!validate_mad(&recv->mad.mad, qp_info->qp->qp_num))
		goto out;

	/*
	 * Allocated up front: it serves as the reply/forward buffer and,
	 * at "out", as the replacement receive buffer.
	 */
	response = kmem_cache_alloc(ib_mad_cache, GFP_KERNEL);
	if (!response) {
		printk(KERN_ERR PFX "ib_mad_recv_done_handler no memory "
		       "for response buffer\n");
		goto out;
	}

	/* On a switch use the port from the completion, else our own port */
	if (port_priv->device->node_type == RDMA_NODE_IB_SWITCH)
		port_num = wc->port_num;
	else
		port_num = port_priv->port_num;

	if (recv->mad.mad.mad_hdr.mgmt_class ==
	    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
		enum smi_forward_action retsmi;

		if (smi_handle_dr_smp_recv(&recv->mad.smp,
					   port_priv->device->node_type,
					   port_num,
					   port_priv->device->phys_port_cnt) ==
					   IB_SMI_DISCARD)
			goto out;

		retsmi = smi_check_forward_dr_smp(&recv->mad.smp);
		if (retsmi == IB_SMI_LOCAL)
			goto local;

		if (retsmi == IB_SMI_SEND) { /* don't forward */
			if (smi_handle_dr_smp_send(&recv->mad.smp,
						   port_priv->device->node_type,
						   port_num) == IB_SMI_DISCARD)
				goto out;

			if (smi_check_local_smp(&recv->mad.smp, port_priv->device) == IB_SMI_DISCARD)
				goto out;
		} else if (port_priv->device->node_type == RDMA_NODE_IB_SWITCH) {
			/* forward case for switches */
			memcpy(response, recv, sizeof(*response));
			/* Redirect the copied pointers to the copy itself */
			response->header.recv_wc.wc = &response->header.wc;
			response->header.recv_wc.recv_buf.mad = &response->mad.mad;
			response->header.recv_wc.recv_buf.grh = &response->grh;

			agent_send_response(&response->mad.mad,
					    &response->grh, wc,
					    port_priv->device,
					    smi_get_fwd_port(&recv->mad.smp),
					    qp_info->qp->qp_num);

			goto out;
		}
	}

local:
	/* Give driver "right of first refusal" on incoming MAD */
	if (port_priv->device->process_mad) {
		ret = port_priv->device->process_mad(port_priv->device, 0,
						     port_priv->port_num,
						     wc, &recv->grh,
						     &recv->mad.mad,
						     &response->mad.mad);
		if (ret & IB_MAD_RESULT_SUCCESS) {
			/* Driver consumed the MAD: nothing more to do */
			if (ret & IB_MAD_RESULT_CONSUMED)
				goto out;
			/* Driver filled in a reply: send it */
			if (ret & IB_MAD_RESULT_REPLY) {
				agent_send_response(&response->mad.mad,
						    &recv->grh, wc,
						    port_priv->device,
						    port_num,
						    qp_info->qp->qp_num);
				goto out;
			}
		}
	}

	mad_agent = find_mad_agent(port_priv, &recv->mad.mad);
	if (mad_agent) {
		ib_mad_complete_recv(mad_agent, &recv->header.recv_wc);
		/*
		 * recv is freed up in error cases in ib_mad_complete_recv
		 * or via recv_handler in ib_mad_complete_recv()
		 */
		recv = NULL;
	} else if ((ret & IB_MAD_RESULT_SUCCESS) &&
		   generate_unmatched_resp(recv, response)) {
		agent_send_response(&response->mad.mad, &recv->grh, wc,
				    port_priv->device, port_num, qp_info->qp->qp_num);
	}

out:
	/* Post another receive request for this QP */
	if (response) {
		ib_mad_post_receive_mads(qp_info, response);
		/* recv is still ours unless it was handed to an agent */
		if (recv)
			kmem_cache_free(ib_mad_cache, recv);
	} else
		ib_mad_post_receive_mads(qp_info, recv);
}
2000
2001static void adjust_timeout(struct ib_mad_agent_private *mad_agent_priv)
2002{
2003	struct ib_mad_send_wr_private *mad_send_wr;
2004	unsigned long delay;
2005
2006	if (list_empty(&mad_agent_priv->wait_list)) {
2007		__cancel_delayed_work(&mad_agent_priv->timed_work);
2008	} else {
2009		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2010					 struct ib_mad_send_wr_private,
2011					 agent_list);
2012
2013		if (time_after(mad_agent_priv->timeout,
2014			       mad_send_wr->timeout)) {
2015			mad_agent_priv->timeout = mad_send_wr->timeout;
2016			__cancel_delayed_work(&mad_agent_priv->timed_work);
2017			delay = mad_send_wr->timeout - jiffies;
2018			if ((long)delay <= 0)
2019				delay = 1;
2020			queue_delayed_work(mad_agent_priv->qp_info->
2021					   port_priv->wq,
2022					   &mad_agent_priv->timed_work, delay);
2023		}
2024	}
2025}
2026
2027static void wait_for_response(struct ib_mad_send_wr_private *mad_send_wr)
2028{
2029	struct ib_mad_agent_private *mad_agent_priv;
2030	struct ib_mad_send_wr_private *temp_mad_send_wr;
2031	struct list_head *list_item;
2032	unsigned long delay;
2033
2034	mad_agent_priv = mad_send_wr->mad_agent_priv;
2035	list_del(&mad_send_wr->agent_list);
2036
2037	delay = mad_send_wr->timeout;
2038	mad_send_wr->timeout += jiffies;
2039
2040	if (delay) {
2041		list_for_each_prev(list_item, &mad_agent_priv->wait_list) {
2042			temp_mad_send_wr = list_entry(list_item,
2043						struct ib_mad_send_wr_private,
2044						agent_list);
2045			if (time_after(mad_send_wr->timeout,
2046				       temp_mad_send_wr->timeout))
2047				break;
2048		}
 
 
2049	}
2050	else
2051		list_item = &mad_agent_priv->wait_list;
2052	list_add(&mad_send_wr->agent_list, list_item);
2053
2054	/* Reschedule a work item if we have a shorter timeout */
2055	if (mad_agent_priv->wait_list.next == &mad_send_wr->agent_list) {
2056		__cancel_delayed_work(&mad_agent_priv->timed_work);
2057		queue_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
2058				   &mad_agent_priv->timed_work, delay);
2059	}
2060}
2061
2062void ib_reset_mad_timeout(struct ib_mad_send_wr_private *mad_send_wr,
2063			  int timeout_ms)
2064{
2065	mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2066	wait_for_response(mad_send_wr);
2067}
2068
2069/*
2070 * Process a send work completion
2071 */
2072void ib_mad_complete_send_wr(struct ib_mad_send_wr_private *mad_send_wr,
2073			     struct ib_mad_send_wc *mad_send_wc)
2074{
2075	struct ib_mad_agent_private	*mad_agent_priv;
2076	unsigned long			flags;
2077	int				ret;
2078
2079	mad_agent_priv = mad_send_wr->mad_agent_priv;
2080	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2081	if (mad_agent_priv->agent.rmpp_version) {
2082		ret = ib_process_rmpp_send_wc(mad_send_wr, mad_send_wc);
2083		if (ret == IB_RMPP_RESULT_CONSUMED)
2084			goto done;
2085	} else
2086		ret = IB_RMPP_RESULT_UNHANDLED;
2087
2088	if (mad_send_wc->status != IB_WC_SUCCESS &&
2089	    mad_send_wr->status == IB_WC_SUCCESS) {
2090		mad_send_wr->status = mad_send_wc->status;
2091		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2092	}
2093
2094	if (--mad_send_wr->refcount > 0) {
2095		if (mad_send_wr->refcount == 1 && mad_send_wr->timeout &&
2096		    mad_send_wr->status == IB_WC_SUCCESS) {
2097			wait_for_response(mad_send_wr);
2098		}
2099		goto done;
2100	}
2101
2102	/* Remove send from MAD agent and notify client of completion */
2103	list_del(&mad_send_wr->agent_list);
2104	adjust_timeout(mad_agent_priv);
2105	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2106
2107	if (mad_send_wr->status != IB_WC_SUCCESS )
2108		mad_send_wc->status = mad_send_wr->status;
2109	if (ret == IB_RMPP_RESULT_INTERNAL)
2110		ib_rmpp_send_handler(mad_send_wc);
2111	else
2112		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2113						   mad_send_wc);
2114
2115	/* Release reference on agent taken when sending */
2116	deref_mad_agent(mad_agent_priv);
2117	return;
2118done:
2119	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2120}
2121
2122static void ib_mad_send_done_handler(struct ib_mad_port_private *port_priv,
2123				     struct ib_wc *wc)
2124{
 
 
 
2125	struct ib_mad_send_wr_private	*mad_send_wr, *queued_send_wr;
2126	struct ib_mad_list_head		*mad_list;
2127	struct ib_mad_qp_info		*qp_info;
2128	struct ib_mad_queue		*send_queue;
2129	struct ib_send_wr		*bad_send_wr;
2130	struct ib_mad_send_wc		mad_send_wc;
2131	unsigned long flags;
2132	int ret;
2133
2134	mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
 
 
 
 
 
 
 
2135	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2136				   mad_list);
2137	send_queue = mad_list->mad_queue;
2138	qp_info = send_queue->qp_info;
2139
 
 
 
2140retry:
2141	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2142			    mad_send_wr->header_mapping,
2143			    mad_send_wr->sg_list[0].length, DMA_TO_DEVICE);
2144	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2145			    mad_send_wr->payload_mapping,
2146			    mad_send_wr->sg_list[1].length, DMA_TO_DEVICE);
2147	queued_send_wr = NULL;
2148	spin_lock_irqsave(&send_queue->lock, flags);
2149	list_del(&mad_list->list);
2150
2151	/* Move queued send to the send queue */
2152	if (send_queue->count-- > send_queue->max_active) {
2153		mad_list = container_of(qp_info->overflow_list.next,
2154					struct ib_mad_list_head, list);
2155		queued_send_wr = container_of(mad_list,
2156					struct ib_mad_send_wr_private,
2157					mad_list);
2158		list_move_tail(&mad_list->list, &send_queue->list);
2159	}
2160	spin_unlock_irqrestore(&send_queue->lock, flags);
2161
2162	mad_send_wc.send_buf = &mad_send_wr->send_buf;
2163	mad_send_wc.status = wc->status;
2164	mad_send_wc.vendor_err = wc->vendor_err;
2165	if (atomic_read(&qp_info->snoop_count))
2166		snoop_send(qp_info, &mad_send_wr->send_buf, &mad_send_wc,
2167			   IB_MAD_SNOOP_SEND_COMPLETIONS);
2168	ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
2169
2170	if (queued_send_wr) {
2171		ret = ib_post_send(qp_info->qp, &queued_send_wr->send_wr,
2172				   &bad_send_wr);
 
2173		if (ret) {
2174			printk(KERN_ERR PFX "ib_post_send failed: %d\n", ret);
 
2175			mad_send_wr = queued_send_wr;
2176			wc->status = IB_WC_LOC_QP_OP_ERR;
2177			goto retry;
2178		}
2179	}
2180}
2181
2182static void mark_sends_for_retry(struct ib_mad_qp_info *qp_info)
2183{
2184	struct ib_mad_send_wr_private *mad_send_wr;
2185	struct ib_mad_list_head *mad_list;
2186	unsigned long flags;
2187
2188	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
2189	list_for_each_entry(mad_list, &qp_info->send_queue.list, list) {
2190		mad_send_wr = container_of(mad_list,
2191					   struct ib_mad_send_wr_private,
2192					   mad_list);
2193		mad_send_wr->retry = 1;
2194	}
2195	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
2196}
2197
2198static void mad_error_handler(struct ib_mad_port_private *port_priv,
2199			      struct ib_wc *wc)
2200{
2201	struct ib_mad_list_head *mad_list;
2202	struct ib_mad_qp_info *qp_info;
 
2203	struct ib_mad_send_wr_private *mad_send_wr;
2204	int ret;
2205
2206	/* Determine if failure was a send or receive */
2207	mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
2208	qp_info = mad_list->mad_queue->qp_info;
2209	if (mad_list->mad_queue == &qp_info->recv_queue)
2210		/*
2211		 * Receive errors indicate that the QP has entered the error
2212		 * state - error handling/shutdown code will cleanup
2213		 */
2214		return;
2215
2216	/*
2217	 * Send errors will transition the QP to SQE - move
2218	 * QP to RTS and repost flushed work requests
2219	 */
2220	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2221				   mad_list);
2222	if (wc->status == IB_WC_WR_FLUSH_ERR) {
2223		if (mad_send_wr->retry) {
2224			/* Repost send */
2225			struct ib_send_wr *bad_send_wr;
2226
2227			mad_send_wr->retry = 0;
2228			ret = ib_post_send(qp_info->qp, &mad_send_wr->send_wr,
2229					&bad_send_wr);
2230			if (ret)
2231				ib_mad_send_done_handler(port_priv, wc);
2232		} else
2233			ib_mad_send_done_handler(port_priv, wc);
2234	} else {
2235		struct ib_qp_attr *attr;
2236
2237		/* Transition QP to RTS and fail offending send */
2238		attr = kmalloc(sizeof *attr, GFP_KERNEL);
2239		if (attr) {
2240			attr->qp_state = IB_QPS_RTS;
2241			attr->cur_qp_state = IB_QPS_SQE;
2242			ret = ib_modify_qp(qp_info->qp, attr,
2243					   IB_QP_STATE | IB_QP_CUR_STATE);
2244			kfree(attr);
2245			if (ret)
2246				printk(KERN_ERR PFX "mad_error_handler - "
2247				       "ib_modify_qp to RTS : %d\n", ret);
 
2248			else
2249				mark_sends_for_retry(qp_info);
2250		}
2251		ib_mad_send_done_handler(port_priv, wc);
2252	}
2253}
2254
2255/*
2256 * IB MAD completion callback
2257 */
2258static void ib_mad_completion_handler(struct work_struct *work)
2259{
2260	struct ib_mad_port_private *port_priv;
2261	struct ib_wc wc;
2262
2263	port_priv = container_of(work, struct ib_mad_port_private, work);
2264	ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2265
2266	while (ib_poll_cq(port_priv->cq, 1, &wc) == 1) {
2267		if (wc.status == IB_WC_SUCCESS) {
2268			switch (wc.opcode) {
2269			case IB_WC_SEND:
2270				ib_mad_send_done_handler(port_priv, &wc);
2271				break;
2272			case IB_WC_RECV:
2273				ib_mad_recv_done_handler(port_priv, &wc);
2274				break;
2275			default:
2276				BUG_ON(1);
2277				break;
2278			}
2279		} else
2280			mad_error_handler(port_priv, &wc);
2281	}
2282}
2283
2284static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv)
2285{
2286	unsigned long flags;
2287	struct ib_mad_send_wr_private *mad_send_wr, *temp_mad_send_wr;
2288	struct ib_mad_send_wc mad_send_wc;
2289	struct list_head cancel_list;
2290
2291	INIT_LIST_HEAD(&cancel_list);
2292
2293	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2294	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2295				 &mad_agent_priv->send_list, agent_list) {
2296		if (mad_send_wr->status == IB_WC_SUCCESS) {
2297			mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2298			mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2299		}
2300	}
2301
2302	/* Empty wait list to prevent receives from finding a request */
2303	list_splice_init(&mad_agent_priv->wait_list, &cancel_list);
2304	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2305
2306	/* Report all cancelled requests */
2307	mad_send_wc.status = IB_WC_WR_FLUSH_ERR;
2308	mad_send_wc.vendor_err = 0;
2309
2310	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2311				 &cancel_list, agent_list) {
2312		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2313		list_del(&mad_send_wr->agent_list);
2314		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2315						   &mad_send_wc);
2316		atomic_dec(&mad_agent_priv->refcount);
2317	}
2318}
2319
2320static struct ib_mad_send_wr_private*
2321find_send_wr(struct ib_mad_agent_private *mad_agent_priv,
2322	     struct ib_mad_send_buf *send_buf)
2323{
2324	struct ib_mad_send_wr_private *mad_send_wr;
2325
2326	list_for_each_entry(mad_send_wr, &mad_agent_priv->wait_list,
2327			    agent_list) {
2328		if (&mad_send_wr->send_buf == send_buf)
2329			return mad_send_wr;
2330	}
2331
2332	list_for_each_entry(mad_send_wr, &mad_agent_priv->send_list,
2333			    agent_list) {
2334		if (is_data_mad(mad_agent_priv, mad_send_wr->send_buf.mad) &&
 
2335		    &mad_send_wr->send_buf == send_buf)
2336			return mad_send_wr;
2337	}
2338	return NULL;
2339}
2340
2341int ib_modify_mad(struct ib_mad_agent *mad_agent,
2342		  struct ib_mad_send_buf *send_buf, u32 timeout_ms)
2343{
2344	struct ib_mad_agent_private *mad_agent_priv;
2345	struct ib_mad_send_wr_private *mad_send_wr;
2346	unsigned long flags;
2347	int active;
2348
2349	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
2350				      agent);
 
 
 
2351	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2352	mad_send_wr = find_send_wr(mad_agent_priv, send_buf);
2353	if (!mad_send_wr || mad_send_wr->status != IB_WC_SUCCESS) {
2354		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2355		return -EINVAL;
2356	}
2357
2358	active = (!mad_send_wr->timeout || mad_send_wr->refcount > 1);
2359	if (!timeout_ms) {
2360		mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2361		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2362	}
2363
2364	mad_send_wr->send_buf.timeout_ms = timeout_ms;
2365	if (active)
2366		mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2367	else
2368		ib_reset_mad_timeout(mad_send_wr, timeout_ms);
2369
2370	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2371	return 0;
2372}
2373EXPORT_SYMBOL(ib_modify_mad);
2374
/*
 * Cancel an outstanding send by calling ib_modify_mad() with a timeout
 * of 0.  The return value of ib_modify_mad() is discarded.
 */
void ib_cancel_mad(struct ib_mad_agent *mad_agent,
		   struct ib_mad_send_buf *send_buf)
{
	ib_modify_mad(mad_agent, send_buf, 0);
}
EXPORT_SYMBOL(ib_cancel_mad);
2381
/*
 * Work handler that drains an agent's local_list.
 *
 * Each entry is removed from the list under the agent lock, and the lock
 * is dropped while the entry is processed.  When the entry carries a
 * MAD (local->mad_priv), a receive completion is synthesized and passed
 * to the receiving agent's recv_handler before the send is completed.
 * The sender's send_handler is then called with IB_WC_SUCCESS.  The
 * agent lock is retaken before the entry is freed and the list is
 * examined again.
 */
static void local_completions(struct work_struct *work)
{
	struct ib_mad_agent_private *mad_agent_priv;
	struct ib_mad_local_private *local;
	struct ib_mad_agent_private *recv_mad_agent;
	unsigned long flags;
	int free_mad;
	struct ib_wc wc;
	struct ib_mad_send_wc mad_send_wc;

	mad_agent_priv =
		container_of(work, struct ib_mad_agent_private, local_work);

	spin_lock_irqsave(&mad_agent_priv->lock, flags);
	while (!list_empty(&mad_agent_priv->local_list)) {
		local = list_entry(mad_agent_priv->local_list.next,
				   struct ib_mad_local_private,
				   completion_list);
		list_del(&local->completion_list);
		/* Callbacks below run without the agent lock held */
		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
		free_mad = 0;
		if (local->mad_priv) {
			recv_mad_agent = local->recv_mad_agent;
			if (!recv_mad_agent) {
				printk(KERN_ERR PFX "No receive MAD agent for local completion\n");
				/* Nobody will take the MAD: free it ourselves below */
				free_mad = 1;
				goto local_send_completion;
			}

			/*
			 * Defined behavior is to complete response
			 * before request
			 */
			build_smp_wc(recv_mad_agent->agent.qp,
				     (unsigned long) local->mad_send_wr,
				     be16_to_cpu(IB_LID_PERMISSIVE),
				     0, recv_mad_agent->agent.port_num, &wc);

			/* Fill in the receive completion handed to the agent */
			local->mad_priv->header.recv_wc.wc = &wc;
			local->mad_priv->header.recv_wc.mad_len =
						sizeof(struct ib_mad);
			INIT_LIST_HEAD(&local->mad_priv->header.recv_wc.rmpp_list);
			list_add(&local->mad_priv->header.recv_wc.recv_buf.list,
				 &local->mad_priv->header.recv_wc.rmpp_list);
			local->mad_priv->header.recv_wc.recv_buf.grh = NULL;
			local->mad_priv->header.recv_wc.recv_buf.mad =
						&local->mad_priv->mad.mad;
			if (atomic_read(&recv_mad_agent->qp_info->snoop_count))
				snoop_recv(recv_mad_agent->qp_info,
					  &local->mad_priv->header.recv_wc,
					   IB_MAD_SNOOP_RECVS);
			recv_mad_agent->agent.recv_handler(
						&recv_mad_agent->agent,
						&local->mad_priv->header.recv_wc);
			/* Drop one reference on the receiving agent */
			spin_lock_irqsave(&recv_mad_agent->lock, flags);
			atomic_dec(&recv_mad_agent->refcount);
			spin_unlock_irqrestore(&recv_mad_agent->lock, flags);
		}

local_send_completion:
		/* Complete send */
		mad_send_wc.status = IB_WC_SUCCESS;
		mad_send_wc.vendor_err = 0;
		mad_send_wc.send_buf = &local->mad_send_wr->send_buf;
		if (atomic_read(&mad_agent_priv->qp_info->snoop_count))
			snoop_send(mad_agent_priv->qp_info,
				   &local->mad_send_wr->send_buf,
				   &mad_send_wc, IB_MAD_SNOOP_SEND_COMPLETIONS);
		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
						   &mad_send_wc);

		/* Retake the lock for the next list_empty() check */
		spin_lock_irqsave(&mad_agent_priv->lock, flags);
		atomic_dec(&mad_agent_priv->refcount);
		if (free_mad)
			kmem_cache_free(ib_mad_cache, local->mad_priv);
		kfree(local);
	}
	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
}
2461
2462static int retry_send(struct ib_mad_send_wr_private *mad_send_wr)
2463{
2464	int ret;
2465
2466	if (!mad_send_wr->retries_left)
2467		return -ETIMEDOUT;
2468
2469	mad_send_wr->retries_left--;
2470	mad_send_wr->send_buf.retries++;
2471
2472	mad_send_wr->timeout = msecs_to_jiffies(mad_send_wr->send_buf.timeout_ms);
2473
2474	if (mad_send_wr->mad_agent_priv->agent.rmpp_version) {
2475		ret = ib_retry_rmpp(mad_send_wr);
2476		switch (ret) {
2477		case IB_RMPP_RESULT_UNHANDLED:
2478			ret = ib_send_mad(mad_send_wr);
2479			break;
2480		case IB_RMPP_RESULT_CONSUMED:
2481			ret = 0;
2482			break;
2483		default:
2484			ret = -ECOMM;
2485			break;
2486		}
2487	} else
2488		ret = ib_send_mad(mad_send_wr);
2489
2490	if (!ret) {
2491		mad_send_wr->refcount++;
2492		list_add_tail(&mad_send_wr->agent_list,
2493			      &mad_send_wr->mad_agent_priv->send_list);
2494	}
2495	return ret;
2496}
2497
2498static void timeout_sends(struct work_struct *work)
2499{
2500	struct ib_mad_agent_private *mad_agent_priv;
2501	struct ib_mad_send_wr_private *mad_send_wr;
2502	struct ib_mad_send_wc mad_send_wc;
2503	unsigned long flags, delay;
2504
2505	mad_agent_priv = container_of(work, struct ib_mad_agent_private,
2506				      timed_work.work);
2507	mad_send_wc.vendor_err = 0;
2508
2509	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2510	while (!list_empty(&mad_agent_priv->wait_list)) {
2511		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2512					 struct ib_mad_send_wr_private,
2513					 agent_list);
2514
2515		if (time_after(mad_send_wr->timeout, jiffies)) {
2516			delay = mad_send_wr->timeout - jiffies;
2517			if ((long)delay <= 0)
2518				delay = 1;
2519			queue_delayed_work(mad_agent_priv->qp_info->
2520					   port_priv->wq,
2521					   &mad_agent_priv->timed_work, delay);
2522			break;
2523		}
2524
2525		list_del(&mad_send_wr->agent_list);
2526		if (mad_send_wr->status == IB_WC_SUCCESS &&
2527		    !retry_send(mad_send_wr))
2528			continue;
2529
2530		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2531
2532		if (mad_send_wr->status == IB_WC_SUCCESS)
2533			mad_send_wc.status = IB_WC_RESP_TIMEOUT_ERR;
2534		else
2535			mad_send_wc.status = mad_send_wr->status;
2536		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2537		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2538						   &mad_send_wc);
2539
2540		atomic_dec(&mad_agent_priv->refcount);
2541		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2542	}
2543	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2544}
2545
2546static void ib_mad_thread_completion_handler(struct ib_cq *cq, void *arg)
2547{
2548	struct ib_mad_port_private *port_priv = cq->cq_context;
2549	unsigned long flags;
2550
2551	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2552	if (!list_empty(&port_priv->port_list))
2553		queue_work(port_priv->wq, &port_priv->work);
2554	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2555}
2556
2557/*
2558 * Allocate receive MADs and post receive WRs for them
2559 */
2560static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
2561				    struct ib_mad_private *mad)
2562{
2563	unsigned long flags;
2564	int post, ret;
2565	struct ib_mad_private *mad_priv;
2566	struct ib_sge sg_list;
2567	struct ib_recv_wr recv_wr, *bad_recv_wr;
2568	struct ib_mad_queue *recv_queue = &qp_info->recv_queue;
2569
2570	/* Initialize common scatter list fields */
2571	sg_list.length = sizeof *mad_priv - sizeof mad_priv->header;
2572	sg_list.lkey = (*qp_info->port_priv->mr).lkey;
2573
2574	/* Initialize common receive WR fields */
2575	recv_wr.next = NULL;
2576	recv_wr.sg_list = &sg_list;
2577	recv_wr.num_sge = 1;
2578
2579	do {
2580		/* Allocate and map receive buffer */
2581		if (mad) {
2582			mad_priv = mad;
2583			mad = NULL;
2584		} else {
2585			mad_priv = kmem_cache_alloc(ib_mad_cache, GFP_KERNEL);
 
2586			if (!mad_priv) {
2587				printk(KERN_ERR PFX "No memory for receive buffer\n");
2588				ret = -ENOMEM;
2589				break;
2590			}
2591		}
 
2592		sg_list.addr = ib_dma_map_single(qp_info->port_priv->device,
2593						 &mad_priv->grh,
2594						 sizeof *mad_priv -
2595						   sizeof mad_priv->header,
2596						 DMA_FROM_DEVICE);
 
 
 
 
 
 
2597		mad_priv->header.mapping = sg_list.addr;
2598		recv_wr.wr_id = (unsigned long)&mad_priv->header.mad_list;
2599		mad_priv->header.mad_list.mad_queue = recv_queue;
 
 
2600
2601		/* Post receive WR */
2602		spin_lock_irqsave(&recv_queue->lock, flags);
2603		post = (++recv_queue->count < recv_queue->max_active);
2604		list_add_tail(&mad_priv->header.mad_list.list, &recv_queue->list);
2605		spin_unlock_irqrestore(&recv_queue->lock, flags);
2606		ret = ib_post_recv(qp_info->qp, &recv_wr, &bad_recv_wr);
2607		if (ret) {
2608			spin_lock_irqsave(&recv_queue->lock, flags);
2609			list_del(&mad_priv->header.mad_list.list);
2610			recv_queue->count--;
2611			spin_unlock_irqrestore(&recv_queue->lock, flags);
2612			ib_dma_unmap_single(qp_info->port_priv->device,
2613					    mad_priv->header.mapping,
2614					    sizeof *mad_priv -
2615					      sizeof mad_priv->header,
2616					    DMA_FROM_DEVICE);
2617			kmem_cache_free(ib_mad_cache, mad_priv);
2618			printk(KERN_ERR PFX "ib_post_recv failed: %d\n", ret);
 
2619			break;
2620		}
2621	} while (post);
2622
2623	return ret;
2624}
2625
2626/*
2627 * Return all the posted receive MADs
2628 */
2629static void cleanup_recv_queue(struct ib_mad_qp_info *qp_info)
2630{
2631	struct ib_mad_private_header *mad_priv_hdr;
2632	struct ib_mad_private *recv;
2633	struct ib_mad_list_head *mad_list;
2634
2635	if (!qp_info->qp)
2636		return;
2637
2638	while (!list_empty(&qp_info->recv_queue.list)) {
2639
2640		mad_list = list_entry(qp_info->recv_queue.list.next,
2641				      struct ib_mad_list_head, list);
2642		mad_priv_hdr = container_of(mad_list,
2643					    struct ib_mad_private_header,
2644					    mad_list);
2645		recv = container_of(mad_priv_hdr, struct ib_mad_private,
2646				    header);
2647
2648		/* Remove from posted receive MAD list */
2649		list_del(&mad_list->list);
2650
2651		ib_dma_unmap_single(qp_info->port_priv->device,
2652				    recv->header.mapping,
2653				    sizeof(struct ib_mad_private) -
2654				      sizeof(struct ib_mad_private_header),
2655				    DMA_FROM_DEVICE);
2656		kmem_cache_free(ib_mad_cache, recv);
2657	}
2658
2659	qp_info->recv_queue.count = 0;
2660}
2661
2662/*
2663 * Start the port
2664 */
2665static int ib_mad_port_start(struct ib_mad_port_private *port_priv)
2666{
2667	int ret, i;
2668	struct ib_qp_attr *attr;
2669	struct ib_qp *qp;
 
2670
2671	attr = kmalloc(sizeof *attr, GFP_KERNEL);
2672	if (!attr) {
2673		printk(KERN_ERR PFX "Couldn't kmalloc ib_qp_attr\n");
2674		return -ENOMEM;
2675	}
 
 
 
 
2676
2677	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2678		qp = port_priv->qp_info[i].qp;
2679		if (!qp)
2680			continue;
2681
2682		/*
2683		 * PKey index for QP1 is irrelevant but
2684		 * one is needed for the Reset to Init transition
2685		 */
2686		attr->qp_state = IB_QPS_INIT;
2687		attr->pkey_index = 0;
2688		attr->qkey = (qp->qp_num == 0) ? 0 : IB_QP1_QKEY;
2689		ret = ib_modify_qp(qp, attr, IB_QP_STATE |
2690					     IB_QP_PKEY_INDEX | IB_QP_QKEY);
2691		if (ret) {
2692			printk(KERN_ERR PFX "Couldn't change QP%d state to "
2693			       "INIT: %d\n", i, ret);
 
2694			goto out;
2695		}
2696
2697		attr->qp_state = IB_QPS_RTR;
2698		ret = ib_modify_qp(qp, attr, IB_QP_STATE);
2699		if (ret) {
2700			printk(KERN_ERR PFX "Couldn't change QP%d state to "
2701			       "RTR: %d\n", i, ret);
 
2702			goto out;
2703		}
2704
2705		attr->qp_state = IB_QPS_RTS;
2706		attr->sq_psn = IB_MAD_SEND_Q_PSN;
2707		ret = ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_SQ_PSN);
2708		if (ret) {
2709			printk(KERN_ERR PFX "Couldn't change QP%d state to "
2710			       "RTS: %d\n", i, ret);
 
2711			goto out;
2712		}
2713	}
2714
2715	ret = ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2716	if (ret) {
2717		printk(KERN_ERR PFX "Failed to request completion "
2718		       "notification: %d\n", ret);
 
2719		goto out;
2720	}
2721
2722	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2723		if (!port_priv->qp_info[i].qp)
2724			continue;
2725
2726		ret = ib_mad_post_receive_mads(&port_priv->qp_info[i], NULL);
2727		if (ret) {
2728			printk(KERN_ERR PFX "Couldn't post receive WRs\n");
 
2729			goto out;
2730		}
2731	}
2732out:
2733	kfree(attr);
2734	return ret;
2735}
2736
2737static void qp_event_handler(struct ib_event *event, void *qp_context)
2738{
2739	struct ib_mad_qp_info	*qp_info = qp_context;
2740
2741	/* It's worse than that! He's dead, Jim! */
2742	printk(KERN_ERR PFX "Fatal error (%d) on MAD QP (%d)\n",
 
2743		event->event, qp_info->qp->qp_num);
2744}
2745
2746static void init_mad_queue(struct ib_mad_qp_info *qp_info,
2747			   struct ib_mad_queue *mad_queue)
2748{
2749	mad_queue->qp_info = qp_info;
2750	mad_queue->count = 0;
2751	spin_lock_init(&mad_queue->lock);
2752	INIT_LIST_HEAD(&mad_queue->list);
2753}
2754
2755static void init_mad_qp(struct ib_mad_port_private *port_priv,
2756			struct ib_mad_qp_info *qp_info)
2757{
2758	qp_info->port_priv = port_priv;
2759	init_mad_queue(qp_info, &qp_info->send_queue);
2760	init_mad_queue(qp_info, &qp_info->recv_queue);
2761	INIT_LIST_HEAD(&qp_info->overflow_list);
2762	spin_lock_init(&qp_info->snoop_lock);
2763	qp_info->snoop_table = NULL;
2764	qp_info->snoop_table_size = 0;
2765	atomic_set(&qp_info->snoop_count, 0);
2766}
2767
2768static int create_mad_qp(struct ib_mad_qp_info *qp_info,
2769			 enum ib_qp_type qp_type)
2770{
2771	struct ib_qp_init_attr	qp_init_attr;
2772	int ret;
2773
2774	memset(&qp_init_attr, 0, sizeof qp_init_attr);
2775	qp_init_attr.send_cq = qp_info->port_priv->cq;
2776	qp_init_attr.recv_cq = qp_info->port_priv->cq;
2777	qp_init_attr.sq_sig_type = IB_SIGNAL_ALL_WR;
2778	qp_init_attr.cap.max_send_wr = mad_sendq_size;
2779	qp_init_attr.cap.max_recv_wr = mad_recvq_size;
2780	qp_init_attr.cap.max_send_sge = IB_MAD_SEND_REQ_MAX_SG;
2781	qp_init_attr.cap.max_recv_sge = IB_MAD_RECV_REQ_MAX_SG;
2782	qp_init_attr.qp_type = qp_type;
2783	qp_init_attr.port_num = qp_info->port_priv->port_num;
2784	qp_init_attr.qp_context = qp_info;
2785	qp_init_attr.event_handler = qp_event_handler;
2786	qp_info->qp = ib_create_qp(qp_info->port_priv->pd, &qp_init_attr);
2787	if (IS_ERR(qp_info->qp)) {
2788		printk(KERN_ERR PFX "Couldn't create ib_mad QP%d\n",
2789		       get_spl_qp_index(qp_type));
 
2790		ret = PTR_ERR(qp_info->qp);
2791		goto error;
2792	}
2793	/* Use minimum queue sizes unless the CQ is resized */
2794	qp_info->send_queue.max_active = mad_sendq_size;
2795	qp_info->recv_queue.max_active = mad_recvq_size;
2796	return 0;
2797
2798error:
2799	return ret;
2800}
2801
2802static void destroy_mad_qp(struct ib_mad_qp_info *qp_info)
2803{
2804	if (!qp_info->qp)
2805		return;
2806
2807	ib_destroy_qp(qp_info->qp);
2808	kfree(qp_info->snoop_table);
2809}
2810
2811/*
2812 * Open the port
2813 * Create the QP, PD, MR, and CQ if needed
2814 */
2815static int ib_mad_port_open(struct ib_device *device,
2816			    int port_num)
2817{
2818	int ret, cq_size;
2819	struct ib_mad_port_private *port_priv;
2820	unsigned long flags;
2821	char name[sizeof "ib_mad123"];
2822	int has_smi;
2823
 
 
 
 
 
 
 
2824	/* Create new device info */
2825	port_priv = kzalloc(sizeof *port_priv, GFP_KERNEL);
2826	if (!port_priv) {
2827		printk(KERN_ERR PFX "No memory for ib_mad_port_private\n");
2828		return -ENOMEM;
2829	}
2830
2831	port_priv->device = device;
2832	port_priv->port_num = port_num;
2833	spin_lock_init(&port_priv->reg_lock);
2834	INIT_LIST_HEAD(&port_priv->agent_list);
2835	init_mad_qp(port_priv, &port_priv->qp_info[0]);
2836	init_mad_qp(port_priv, &port_priv->qp_info[1]);
2837
2838	cq_size = mad_sendq_size + mad_recvq_size;
2839	has_smi = rdma_port_get_link_layer(device, port_num) == IB_LINK_LAYER_INFINIBAND;
2840	if (has_smi)
2841		cq_size *= 2;
2842
2843	port_priv->cq = ib_create_cq(port_priv->device,
2844				     ib_mad_thread_completion_handler,
2845				     NULL, port_priv, cq_size, 0);
2846	if (IS_ERR(port_priv->cq)) {
2847		printk(KERN_ERR PFX "Couldn't create ib_mad CQ\n");
2848		ret = PTR_ERR(port_priv->cq);
2849		goto error3;
2850	}
2851
2852	port_priv->pd = ib_alloc_pd(device);
2853	if (IS_ERR(port_priv->pd)) {
2854		printk(KERN_ERR PFX "Couldn't create ib_mad PD\n");
2855		ret = PTR_ERR(port_priv->pd);
 
2856		goto error4;
2857	}
2858
2859	port_priv->mr = ib_get_dma_mr(port_priv->pd, IB_ACCESS_LOCAL_WRITE);
2860	if (IS_ERR(port_priv->mr)) {
2861		printk(KERN_ERR PFX "Couldn't get ib_mad DMA MR\n");
2862		ret = PTR_ERR(port_priv->mr);
2863		goto error5;
2864	}
2865
2866	if (has_smi) {
2867		ret = create_mad_qp(&port_priv->qp_info[0], IB_QPT_SMI);
2868		if (ret)
2869			goto error6;
2870	}
2871	ret = create_mad_qp(&port_priv->qp_info[1], IB_QPT_GSI);
2872	if (ret)
2873		goto error7;
2874
2875	snprintf(name, sizeof name, "ib_mad%d", port_num);
2876	port_priv->wq = create_singlethread_workqueue(name);
2877	if (!port_priv->wq) {
2878		ret = -ENOMEM;
2879		goto error8;
2880	}
2881	INIT_WORK(&port_priv->work, ib_mad_completion_handler);
2882
2883	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2884	list_add_tail(&port_priv->port_list, &ib_mad_port_list);
2885	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2886
2887	ret = ib_mad_port_start(port_priv);
2888	if (ret) {
2889		printk(KERN_ERR PFX "Couldn't start port\n");
2890		goto error9;
2891	}
2892
2893	return 0;
2894
2895error9:
2896	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2897	list_del_init(&port_priv->port_list);
2898	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2899
2900	destroy_workqueue(port_priv->wq);
2901error8:
2902	destroy_mad_qp(&port_priv->qp_info[1]);
2903error7:
2904	destroy_mad_qp(&port_priv->qp_info[0]);
2905error6:
2906	ib_dereg_mr(port_priv->mr);
2907error5:
2908	ib_dealloc_pd(port_priv->pd);
2909error4:
2910	ib_destroy_cq(port_priv->cq);
2911	cleanup_recv_queue(&port_priv->qp_info[1]);
2912	cleanup_recv_queue(&port_priv->qp_info[0]);
 
 
2913error3:
2914	kfree(port_priv);
2915
2916	return ret;
2917}
2918
2919/*
2920 * Close the port
2921 * If there are no classes using the port, free the port
2922 * resources (CQ, MR, PD, QP) and remove the port's info structure
2923 */
2924static int ib_mad_port_close(struct ib_device *device, int port_num)
2925{
2926	struct ib_mad_port_private *port_priv;
2927	unsigned long flags;
2928
2929	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2930	port_priv = __ib_get_mad_port(device, port_num);
2931	if (port_priv == NULL) {
2932		spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2933		printk(KERN_ERR PFX "Port %d not found\n", port_num);
2934		return -ENODEV;
2935	}
2936	list_del_init(&port_priv->port_list);
2937	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2938
2939	destroy_workqueue(port_priv->wq);
2940	destroy_mad_qp(&port_priv->qp_info[1]);
2941	destroy_mad_qp(&port_priv->qp_info[0]);
2942	ib_dereg_mr(port_priv->mr);
2943	ib_dealloc_pd(port_priv->pd);
2944	ib_destroy_cq(port_priv->cq);
2945	cleanup_recv_queue(&port_priv->qp_info[1]);
2946	cleanup_recv_queue(&port_priv->qp_info[0]);
2947	/* XXX: Handle deallocation of MAD registration tables */
2948
2949	kfree(port_priv);
2950
2951	return 0;
2952}
2953
2954static void ib_mad_init_device(struct ib_device *device)
2955{
2956	int start, end, i;
 
 
2957
2958	if (rdma_node_get_transport(device->node_type) != RDMA_TRANSPORT_IB)
2959		return;
2960
2961	if (device->node_type == RDMA_NODE_IB_SWITCH) {
2962		start = 0;
2963		end   = 0;
2964	} else {
2965		start = 1;
2966		end   = device->phys_port_cnt;
2967	}
2968
2969	for (i = start; i <= end; i++) {
2970		if (ib_mad_port_open(device, i)) {
2971			printk(KERN_ERR PFX "Couldn't open %s port %d\n",
2972			       device->name, i);
2973			goto error;
2974		}
2975		if (ib_agent_port_open(device, i)) {
2976			printk(KERN_ERR PFX "Couldn't open %s port %d "
2977			       "for agents\n",
2978			       device->name, i);
2979			goto error_agent;
2980		}
 
2981	}
2982	return;
 
 
 
2983
2984error_agent:
2985	if (ib_mad_port_close(device, i))
2986		printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2987		       device->name, i);
2988
2989error:
2990	i--;
 
 
2991
2992	while (i >= start) {
2993		if (ib_agent_port_close(device, i))
2994			printk(KERN_ERR PFX "Couldn't close %s port %d "
2995			       "for agents\n",
2996			       device->name, i);
2997		if (ib_mad_port_close(device, i))
2998			printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2999			       device->name, i);
3000		i--;
3001	}
 
3002}
3003
3004static void ib_mad_remove_device(struct ib_device *device)
3005{
3006	int i, num_ports, cur_port;
3007
3008	if (rdma_node_get_transport(device->node_type) != RDMA_TRANSPORT_IB)
3009		return;
 
3010
3011	if (device->node_type == RDMA_NODE_IB_SWITCH) {
3012		num_ports = 1;
3013		cur_port = 0;
3014	} else {
3015		num_ports = device->phys_port_cnt;
3016		cur_port = 1;
3017	}
3018	for (i = 0; i < num_ports; i++, cur_port++) {
3019		if (ib_agent_port_close(device, cur_port))
3020			printk(KERN_ERR PFX "Couldn't close %s port %d "
3021			       "for agents\n",
3022			       device->name, cur_port);
3023		if (ib_mad_port_close(device, cur_port))
3024			printk(KERN_ERR PFX "Couldn't close %s port %d\n",
3025			       device->name, cur_port);
3026	}
3027}
3028
3029static struct ib_client mad_client = {
3030	.name   = "mad",
3031	.add = ib_mad_init_device,
3032	.remove = ib_mad_remove_device
3033};
3034
3035static int __init ib_mad_init_module(void)
3036{
3037	int ret;
3038
3039	mad_recvq_size = min(mad_recvq_size, IB_MAD_QP_MAX_SIZE);
3040	mad_recvq_size = max(mad_recvq_size, IB_MAD_QP_MIN_SIZE);
3041
3042	mad_sendq_size = min(mad_sendq_size, IB_MAD_QP_MAX_SIZE);
3043	mad_sendq_size = max(mad_sendq_size, IB_MAD_QP_MIN_SIZE);
3044
3045	ib_mad_cache = kmem_cache_create("ib_mad",
3046					 sizeof(struct ib_mad_private),
3047					 0,
3048					 SLAB_HWCACHE_ALIGN,
3049					 NULL);
3050	if (!ib_mad_cache) {
3051		printk(KERN_ERR PFX "Couldn't create ib_mad cache\n");
3052		ret = -ENOMEM;
3053		goto error1;
3054	}
3055
3056	INIT_LIST_HEAD(&ib_mad_port_list);
3057
3058	if (ib_register_client(&mad_client)) {
3059		printk(KERN_ERR PFX "Couldn't register ib_mad client\n");
3060		ret = -EINVAL;
3061		goto error2;
3062	}
3063
3064	return 0;
3065
3066error2:
3067	kmem_cache_destroy(ib_mad_cache);
3068error1:
3069	return ret;
3070}
3071
3072static void __exit ib_mad_cleanup_module(void)
3073{
3074	ib_unregister_client(&mad_client);
3075	kmem_cache_destroy(ib_mad_cache);
3076}
3077
/* Register the module's init and exit entry points */
module_exit(ib_mad_cleanup_module);
module_init(ib_mad_init_module);