Linux Audio

Check our new training course

Loading...
v3.1
   1/*
   2 * Copyright (c) 2004-2007 Voltaire, Inc. All rights reserved.
   3 * Copyright (c) 2005 Intel Corporation.  All rights reserved.
   4 * Copyright (c) 2005 Mellanox Technologies Ltd.  All rights reserved.
   5 * Copyright (c) 2009 HNR Consulting. All rights reserved.
 
   6 *
   7 * This software is available to you under a choice of one of two
   8 * licenses.  You may choose to be licensed under the terms of the GNU
   9 * General Public License (GPL) Version 2, available from the file
  10 * COPYING in the main directory of this source tree, or the
  11 * OpenIB.org BSD license below:
  12 *
  13 *     Redistribution and use in source and binary forms, with or
  14 *     without modification, are permitted provided that the following
  15 *     conditions are met:
  16 *
  17 *      - Redistributions of source code must retain the above
  18 *        copyright notice, this list of conditions and the following
  19 *        disclaimer.
  20 *
  21 *      - Redistributions in binary form must reproduce the above
  22 *        copyright notice, this list of conditions and the following
  23 *        disclaimer in the documentation and/or other materials
  24 *        provided with the distribution.
  25 *
  26 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  27 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  28 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  29 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  30 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  31 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  32 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  33 * SOFTWARE.
  34 *
  35 */
 
 
 
  36#include <linux/dma-mapping.h>
  37#include <linux/slab.h>
 
 
  38#include <rdma/ib_cache.h>
  39
  40#include "mad_priv.h"
 
  41#include "mad_rmpp.h"
  42#include "smi.h"
 
  43#include "agent.h"
  44
  45MODULE_LICENSE("Dual BSD/GPL");
  46MODULE_DESCRIPTION("kernel IB MAD API");
  47MODULE_AUTHOR("Hal Rosenstock");
  48MODULE_AUTHOR("Sean Hefty");
  49
  50static int mad_sendq_size = IB_MAD_QP_SEND_SIZE;
  51static int mad_recvq_size = IB_MAD_QP_RECV_SIZE;
  52
  53module_param_named(send_queue_size, mad_sendq_size, int, 0444);
  54MODULE_PARM_DESC(send_queue_size, "Size of send queue in number of work requests");
  55module_param_named(recv_queue_size, mad_recvq_size, int, 0444);
  56MODULE_PARM_DESC(recv_queue_size, "Size of receive queue in number of work requests");
  57
  58static struct kmem_cache *ib_mad_cache;
  59
  60static struct list_head ib_mad_port_list;
  61static u32 ib_mad_client_id = 0;
  62
  63/* Port list lock */
  64static DEFINE_SPINLOCK(ib_mad_port_list_lock);
  65
  66/* Forward declarations */
  67static int method_in_use(struct ib_mad_mgmt_method_table **method,
  68			 struct ib_mad_reg_req *mad_reg_req);
  69static void remove_mad_reg_req(struct ib_mad_agent_private *priv);
  70static struct ib_mad_agent_private *find_mad_agent(
  71					struct ib_mad_port_private *port_priv,
  72					struct ib_mad *mad);
  73static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
  74				    struct ib_mad_private *mad);
  75static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv);
  76static void timeout_sends(struct work_struct *work);
  77static void local_completions(struct work_struct *work);
  78static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
  79			      struct ib_mad_agent_private *agent_priv,
  80			      u8 mgmt_class);
  81static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
  82			   struct ib_mad_agent_private *agent_priv);
 
 
 
  83
  84/*
  85 * Returns a ib_mad_port_private structure or NULL for a device/port
  86 * Assumes ib_mad_port_list_lock is being held
  87 */
  88static inline struct ib_mad_port_private *
  89__ib_get_mad_port(struct ib_device *device, int port_num)
  90{
  91	struct ib_mad_port_private *entry;
  92
  93	list_for_each_entry(entry, &ib_mad_port_list, port_list) {
  94		if (entry->device == device && entry->port_num == port_num)
  95			return entry;
  96	}
  97	return NULL;
  98}
  99
 100/*
 101 * Wrapper function to return a ib_mad_port_private structure or NULL
 102 * for a device/port
 103 */
 104static inline struct ib_mad_port_private *
 105ib_get_mad_port(struct ib_device *device, int port_num)
 106{
 107	struct ib_mad_port_private *entry;
 108	unsigned long flags;
 109
 110	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
 111	entry = __ib_get_mad_port(device, port_num);
 112	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
 113
 114	return entry;
 115}
 116
 117static inline u8 convert_mgmt_class(u8 mgmt_class)
 118{
 119	/* Alias IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE to 0 */
 120	return mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE ?
 121		0 : mgmt_class;
 122}
 123
 124static int get_spl_qp_index(enum ib_qp_type qp_type)
 125{
 126	switch (qp_type)
 127	{
 128	case IB_QPT_SMI:
 129		return 0;
 130	case IB_QPT_GSI:
 131		return 1;
 132	default:
 133		return -1;
 134	}
 135}
 136
 137static int vendor_class_index(u8 mgmt_class)
 138{
 139	return mgmt_class - IB_MGMT_CLASS_VENDOR_RANGE2_START;
 140}
 141
 142static int is_vendor_class(u8 mgmt_class)
 143{
 144	if ((mgmt_class < IB_MGMT_CLASS_VENDOR_RANGE2_START) ||
 145	    (mgmt_class > IB_MGMT_CLASS_VENDOR_RANGE2_END))
 146		return 0;
 147	return 1;
 148}
 149
 150static int is_vendor_oui(char *oui)
 151{
 152	if (oui[0] || oui[1] || oui[2])
 153		return 1;
 154	return 0;
 155}
 156
 157static int is_vendor_method_in_use(
 158		struct ib_mad_mgmt_vendor_class *vendor_class,
 159		struct ib_mad_reg_req *mad_reg_req)
 160{
 161	struct ib_mad_mgmt_method_table *method;
 162	int i;
 163
 164	for (i = 0; i < MAX_MGMT_OUI; i++) {
 165		if (!memcmp(vendor_class->oui[i], mad_reg_req->oui, 3)) {
 166			method = vendor_class->method_table[i];
 167			if (method) {
 168				if (method_in_use(&method, mad_reg_req))
 169					return 1;
 170				else
 171					break;
 172			}
 173		}
 174	}
 175	return 0;
 176}
 177
 178int ib_response_mad(struct ib_mad *mad)
 179{
 180	return ((mad->mad_hdr.method & IB_MGMT_METHOD_RESP) ||
 181		(mad->mad_hdr.method == IB_MGMT_METHOD_TRAP_REPRESS) ||
 182		((mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_BM) &&
 183		 (mad->mad_hdr.attr_mod & IB_BM_ATTR_MOD_RESP)));
 184}
 185EXPORT_SYMBOL(ib_response_mad);
 186
 187/*
 188 * ib_register_mad_agent - Register to send/receive MADs
 189 */
 190struct ib_mad_agent *ib_register_mad_agent(struct ib_device *device,
 191					   u8 port_num,
 192					   enum ib_qp_type qp_type,
 193					   struct ib_mad_reg_req *mad_reg_req,
 194					   u8 rmpp_version,
 195					   ib_mad_send_handler send_handler,
 196					   ib_mad_recv_handler recv_handler,
 197					   void *context)
 
 198{
 199	struct ib_mad_port_private *port_priv;
 200	struct ib_mad_agent *ret = ERR_PTR(-EINVAL);
 201	struct ib_mad_agent_private *mad_agent_priv;
 202	struct ib_mad_reg_req *reg_req = NULL;
 203	struct ib_mad_mgmt_class_table *class;
 204	struct ib_mad_mgmt_vendor_class_table *vendor;
 205	struct ib_mad_mgmt_vendor_class *vendor_class;
 206	struct ib_mad_mgmt_method_table *method;
 207	int ret2, qpn;
 208	unsigned long flags;
 209	u8 mgmt_class, vclass;
 210
 211	/* Validate parameters */
 212	qpn = get_spl_qp_index(qp_type);
 213	if (qpn == -1)
 
 
 
 214		goto error1;
 
 215
 216	if (rmpp_version && rmpp_version != IB_MGMT_RMPP_VERSION)
 
 
 
 217		goto error1;
 
 218
 219	/* Validate MAD registration request if supplied */
 220	if (mad_reg_req) {
 221		if (mad_reg_req->mgmt_class_version >= MAX_MGMT_VERSION)
 
 
 
 222			goto error1;
 223		if (!recv_handler)
 
 
 
 224			goto error1;
 
 225		if (mad_reg_req->mgmt_class >= MAX_MGMT_CLASS) {
 226			/*
 227			 * IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE is the only
 228			 * one in this range currently allowed
 229			 */
 230			if (mad_reg_req->mgmt_class !=
 231			    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
 
 
 
 232				goto error1;
 
 233		} else if (mad_reg_req->mgmt_class == 0) {
 234			/*
 235			 * Class 0 is reserved in IBA and is used for
 236			 * aliasing of IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE
 237			 */
 
 
 238			goto error1;
 239		} else if (is_vendor_class(mad_reg_req->mgmt_class)) {
 240			/*
 241			 * If class is in "new" vendor range,
 242			 * ensure supplied OUI is not zero
 243			 */
 244			if (!is_vendor_oui(mad_reg_req->oui))
 
 
 
 245				goto error1;
 
 246		}
 247		/* Make sure class supplied is consistent with RMPP */
 248		if (!ib_is_mad_class_rmpp(mad_reg_req->mgmt_class)) {
 249			if (rmpp_version)
 
 
 
 250				goto error1;
 
 251		}
 
 252		/* Make sure class supplied is consistent with QP type */
 253		if (qp_type == IB_QPT_SMI) {
 254			if ((mad_reg_req->mgmt_class !=
 255					IB_MGMT_CLASS_SUBN_LID_ROUTED) &&
 256			    (mad_reg_req->mgmt_class !=
 257					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE))
 
 
 
 258				goto error1;
 
 259		} else {
 260			if ((mad_reg_req->mgmt_class ==
 261					IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
 262			    (mad_reg_req->mgmt_class ==
 263					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE))
 
 
 
 264				goto error1;
 
 265		}
 266	} else {
 267		/* No registration request supplied */
 268		if (!send_handler)
 269			goto error1;
 
 
 270	}
 271
 272	/* Validate device and port */
 273	port_priv = ib_get_mad_port(device, port_num);
 274	if (!port_priv) {
 
 
 
 275		ret = ERR_PTR(-ENODEV);
 276		goto error1;
 277	}
 278
 279	/* Verify the QP requested is supported.  For example, Ethernet devices
 280	 * will not have QP0 */
 281	if (!port_priv->qp_info[qpn].qp) {
 
 
 282		ret = ERR_PTR(-EPROTONOSUPPORT);
 283		goto error1;
 284	}
 285
 286	/* Allocate structures */
 287	mad_agent_priv = kzalloc(sizeof *mad_agent_priv, GFP_KERNEL);
 288	if (!mad_agent_priv) {
 289		ret = ERR_PTR(-ENOMEM);
 290		goto error1;
 291	}
 292
 293	mad_agent_priv->agent.mr = ib_get_dma_mr(port_priv->qp_info[qpn].qp->pd,
 294						 IB_ACCESS_LOCAL_WRITE);
 295	if (IS_ERR(mad_agent_priv->agent.mr)) {
 296		ret = ERR_PTR(-ENOMEM);
 297		goto error2;
 298	}
 299
 300	if (mad_reg_req) {
 301		reg_req = kmemdup(mad_reg_req, sizeof *reg_req, GFP_KERNEL);
 302		if (!reg_req) {
 303			ret = ERR_PTR(-ENOMEM);
 304			goto error3;
 305		}
 306	}
 307
 308	/* Now, fill in the various structures */
 309	mad_agent_priv->qp_info = &port_priv->qp_info[qpn];
 310	mad_agent_priv->reg_req = reg_req;
 311	mad_agent_priv->agent.rmpp_version = rmpp_version;
 312	mad_agent_priv->agent.device = device;
 313	mad_agent_priv->agent.recv_handler = recv_handler;
 314	mad_agent_priv->agent.send_handler = send_handler;
 315	mad_agent_priv->agent.context = context;
 316	mad_agent_priv->agent.qp = port_priv->qp_info[qpn].qp;
 317	mad_agent_priv->agent.port_num = port_num;
 
 318	spin_lock_init(&mad_agent_priv->lock);
 319	INIT_LIST_HEAD(&mad_agent_priv->send_list);
 320	INIT_LIST_HEAD(&mad_agent_priv->wait_list);
 321	INIT_LIST_HEAD(&mad_agent_priv->done_list);
 322	INIT_LIST_HEAD(&mad_agent_priv->rmpp_list);
 323	INIT_DELAYED_WORK(&mad_agent_priv->timed_work, timeout_sends);
 324	INIT_LIST_HEAD(&mad_agent_priv->local_list);
 325	INIT_WORK(&mad_agent_priv->local_work, local_completions);
 326	atomic_set(&mad_agent_priv->refcount, 1);
 327	init_completion(&mad_agent_priv->comp);
 328
 
 
 
 
 
 
 329	spin_lock_irqsave(&port_priv->reg_lock, flags);
 330	mad_agent_priv->agent.hi_tid = ++ib_mad_client_id;
 331
 332	/*
 333	 * Make sure MAD registration (if supplied)
 334	 * is non overlapping with any existing ones
 335	 */
 336	if (mad_reg_req) {
 337		mgmt_class = convert_mgmt_class(mad_reg_req->mgmt_class);
 338		if (!is_vendor_class(mgmt_class)) {
 339			class = port_priv->version[mad_reg_req->
 340						   mgmt_class_version].class;
 341			if (class) {
 342				method = class->method_table[mgmt_class];
 343				if (method) {
 344					if (method_in_use(&method,
 345							   mad_reg_req))
 346						goto error4;
 347				}
 348			}
 349			ret2 = add_nonoui_reg_req(mad_reg_req, mad_agent_priv,
 350						  mgmt_class);
 351		} else {
 352			/* "New" vendor class range */
 353			vendor = port_priv->version[mad_reg_req->
 354						    mgmt_class_version].vendor;
 355			if (vendor) {
 356				vclass = vendor_class_index(mgmt_class);
 357				vendor_class = vendor->vendor_class[vclass];
 358				if (vendor_class) {
 359					if (is_vendor_method_in_use(
 360							vendor_class,
 361							mad_reg_req))
 362						goto error4;
 363				}
 364			}
 365			ret2 = add_oui_reg_req(mad_reg_req, mad_agent_priv);
 366		}
 367		if (ret2) {
 368			ret = ERR_PTR(ret2);
 369			goto error4;
 370		}
 371	}
 372
 373	/* Add mad agent into port's agent list */
 374	list_add_tail(&mad_agent_priv->agent_list, &port_priv->agent_list);
 375	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 376
 377	return &mad_agent_priv->agent;
 378
 379error4:
 380	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 
 
 381	kfree(reg_req);
 382error3:
 383	ib_dereg_mr(mad_agent_priv->agent.mr);
 384error2:
 385	kfree(mad_agent_priv);
 386error1:
 387	return ret;
 388}
 389EXPORT_SYMBOL(ib_register_mad_agent);
 390
 391static inline int is_snooping_sends(int mad_snoop_flags)
 392{
 393	return (mad_snoop_flags &
 394		(/*IB_MAD_SNOOP_POSTED_SENDS |
 395		 IB_MAD_SNOOP_RMPP_SENDS |*/
 396		 IB_MAD_SNOOP_SEND_COMPLETIONS /*|
 397		 IB_MAD_SNOOP_RMPP_SEND_COMPLETIONS*/));
 398}
 399
 400static inline int is_snooping_recvs(int mad_snoop_flags)
 401{
 402	return (mad_snoop_flags &
 403		(IB_MAD_SNOOP_RECVS /*|
 404		 IB_MAD_SNOOP_RMPP_RECVS*/));
 405}
 406
 407static int register_snoop_agent(struct ib_mad_qp_info *qp_info,
 408				struct ib_mad_snoop_private *mad_snoop_priv)
 409{
 410	struct ib_mad_snoop_private **new_snoop_table;
 411	unsigned long flags;
 412	int i;
 413
 414	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 415	/* Check for empty slot in array. */
 416	for (i = 0; i < qp_info->snoop_table_size; i++)
 417		if (!qp_info->snoop_table[i])
 418			break;
 419
 420	if (i == qp_info->snoop_table_size) {
 421		/* Grow table. */
 422		new_snoop_table = krealloc(qp_info->snoop_table,
 423					   sizeof mad_snoop_priv *
 424					   (qp_info->snoop_table_size + 1),
 425					   GFP_ATOMIC);
 426		if (!new_snoop_table) {
 427			i = -ENOMEM;
 428			goto out;
 429		}
 430
 431		qp_info->snoop_table = new_snoop_table;
 432		qp_info->snoop_table_size++;
 433	}
 434	qp_info->snoop_table[i] = mad_snoop_priv;
 435	atomic_inc(&qp_info->snoop_count);
 436out:
 437	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 438	return i;
 439}
 440
 441struct ib_mad_agent *ib_register_mad_snoop(struct ib_device *device,
 442					   u8 port_num,
 443					   enum ib_qp_type qp_type,
 444					   int mad_snoop_flags,
 445					   ib_mad_snoop_handler snoop_handler,
 446					   ib_mad_recv_handler recv_handler,
 447					   void *context)
 448{
 449	struct ib_mad_port_private *port_priv;
 450	struct ib_mad_agent *ret;
 451	struct ib_mad_snoop_private *mad_snoop_priv;
 452	int qpn;
 
 453
 454	/* Validate parameters */
 455	if ((is_snooping_sends(mad_snoop_flags) && !snoop_handler) ||
 456	    (is_snooping_recvs(mad_snoop_flags) && !recv_handler)) {
 457		ret = ERR_PTR(-EINVAL);
 458		goto error1;
 459	}
 460	qpn = get_spl_qp_index(qp_type);
 461	if (qpn == -1) {
 462		ret = ERR_PTR(-EINVAL);
 463		goto error1;
 464	}
 465	port_priv = ib_get_mad_port(device, port_num);
 466	if (!port_priv) {
 467		ret = ERR_PTR(-ENODEV);
 468		goto error1;
 469	}
 470	/* Allocate structures */
 471	mad_snoop_priv = kzalloc(sizeof *mad_snoop_priv, GFP_KERNEL);
 472	if (!mad_snoop_priv) {
 473		ret = ERR_PTR(-ENOMEM);
 474		goto error1;
 475	}
 476
 477	/* Now, fill in the various structures */
 478	mad_snoop_priv->qp_info = &port_priv->qp_info[qpn];
 479	mad_snoop_priv->agent.device = device;
 480	mad_snoop_priv->agent.recv_handler = recv_handler;
 481	mad_snoop_priv->agent.snoop_handler = snoop_handler;
 482	mad_snoop_priv->agent.context = context;
 483	mad_snoop_priv->agent.qp = port_priv->qp_info[qpn].qp;
 484	mad_snoop_priv->agent.port_num = port_num;
 485	mad_snoop_priv->mad_snoop_flags = mad_snoop_flags;
 486	init_completion(&mad_snoop_priv->comp);
 
 
 
 
 
 
 
 487	mad_snoop_priv->snoop_index = register_snoop_agent(
 488						&port_priv->qp_info[qpn],
 489						mad_snoop_priv);
 490	if (mad_snoop_priv->snoop_index < 0) {
 491		ret = ERR_PTR(mad_snoop_priv->snoop_index);
 492		goto error2;
 493	}
 494
 495	atomic_set(&mad_snoop_priv->refcount, 1);
 496	return &mad_snoop_priv->agent;
 497
 
 498error2:
 499	kfree(mad_snoop_priv);
 500error1:
 501	return ret;
 502}
 503EXPORT_SYMBOL(ib_register_mad_snoop);
 504
 505static inline void deref_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 506{
 507	if (atomic_dec_and_test(&mad_agent_priv->refcount))
 508		complete(&mad_agent_priv->comp);
 509}
 510
 511static inline void deref_snoop_agent(struct ib_mad_snoop_private *mad_snoop_priv)
 512{
 513	if (atomic_dec_and_test(&mad_snoop_priv->refcount))
 514		complete(&mad_snoop_priv->comp);
 515}
 516
 517static void unregister_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 518{
 519	struct ib_mad_port_private *port_priv;
 520	unsigned long flags;
 521
 522	/* Note that we could still be handling received MADs */
 523
 524	/*
 525	 * Canceling all sends results in dropping received response
 526	 * MADs, preventing us from queuing additional work
 527	 */
 528	cancel_mads(mad_agent_priv);
 529	port_priv = mad_agent_priv->qp_info->port_priv;
 530	cancel_delayed_work(&mad_agent_priv->timed_work);
 531
 532	spin_lock_irqsave(&port_priv->reg_lock, flags);
 533	remove_mad_reg_req(mad_agent_priv);
 534	list_del(&mad_agent_priv->agent_list);
 535	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 536
 537	flush_workqueue(port_priv->wq);
 538	ib_cancel_rmpp_recvs(mad_agent_priv);
 539
 540	deref_mad_agent(mad_agent_priv);
 541	wait_for_completion(&mad_agent_priv->comp);
 542
 
 
 543	kfree(mad_agent_priv->reg_req);
 544	ib_dereg_mr(mad_agent_priv->agent.mr);
 545	kfree(mad_agent_priv);
 546}
 547
 548static void unregister_mad_snoop(struct ib_mad_snoop_private *mad_snoop_priv)
 549{
 550	struct ib_mad_qp_info *qp_info;
 551	unsigned long flags;
 552
 553	qp_info = mad_snoop_priv->qp_info;
 554	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 555	qp_info->snoop_table[mad_snoop_priv->snoop_index] = NULL;
 556	atomic_dec(&qp_info->snoop_count);
 557	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 558
 559	deref_snoop_agent(mad_snoop_priv);
 560	wait_for_completion(&mad_snoop_priv->comp);
 561
 
 
 562	kfree(mad_snoop_priv);
 563}
 564
 565/*
 566 * ib_unregister_mad_agent - Unregisters a client from using MAD services
 567 */
 568int ib_unregister_mad_agent(struct ib_mad_agent *mad_agent)
 569{
 570	struct ib_mad_agent_private *mad_agent_priv;
 571	struct ib_mad_snoop_private *mad_snoop_priv;
 572
 573	/* If the TID is zero, the agent can only snoop. */
 574	if (mad_agent->hi_tid) {
 575		mad_agent_priv = container_of(mad_agent,
 576					      struct ib_mad_agent_private,
 577					      agent);
 578		unregister_mad_agent(mad_agent_priv);
 579	} else {
 580		mad_snoop_priv = container_of(mad_agent,
 581					      struct ib_mad_snoop_private,
 582					      agent);
 583		unregister_mad_snoop(mad_snoop_priv);
 584	}
 585	return 0;
 586}
 587EXPORT_SYMBOL(ib_unregister_mad_agent);
 588
 589static void dequeue_mad(struct ib_mad_list_head *mad_list)
 590{
 591	struct ib_mad_queue *mad_queue;
 592	unsigned long flags;
 593
 594	BUG_ON(!mad_list->mad_queue);
 595	mad_queue = mad_list->mad_queue;
 596	spin_lock_irqsave(&mad_queue->lock, flags);
 597	list_del(&mad_list->list);
 598	mad_queue->count--;
 599	spin_unlock_irqrestore(&mad_queue->lock, flags);
 600}
 601
 602static void snoop_send(struct ib_mad_qp_info *qp_info,
 603		       struct ib_mad_send_buf *send_buf,
 604		       struct ib_mad_send_wc *mad_send_wc,
 605		       int mad_snoop_flags)
 606{
 607	struct ib_mad_snoop_private *mad_snoop_priv;
 608	unsigned long flags;
 609	int i;
 610
 611	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 612	for (i = 0; i < qp_info->snoop_table_size; i++) {
 613		mad_snoop_priv = qp_info->snoop_table[i];
 614		if (!mad_snoop_priv ||
 615		    !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
 616			continue;
 617
 618		atomic_inc(&mad_snoop_priv->refcount);
 619		spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 620		mad_snoop_priv->agent.snoop_handler(&mad_snoop_priv->agent,
 621						    send_buf, mad_send_wc);
 622		deref_snoop_agent(mad_snoop_priv);
 623		spin_lock_irqsave(&qp_info->snoop_lock, flags);
 624	}
 625	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 626}
 627
 628static void snoop_recv(struct ib_mad_qp_info *qp_info,
 629		       struct ib_mad_recv_wc *mad_recv_wc,
 630		       int mad_snoop_flags)
 631{
 632	struct ib_mad_snoop_private *mad_snoop_priv;
 633	unsigned long flags;
 634	int i;
 635
 636	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 637	for (i = 0; i < qp_info->snoop_table_size; i++) {
 638		mad_snoop_priv = qp_info->snoop_table[i];
 639		if (!mad_snoop_priv ||
 640		    !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
 641			continue;
 642
 643		atomic_inc(&mad_snoop_priv->refcount);
 644		spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 645		mad_snoop_priv->agent.recv_handler(&mad_snoop_priv->agent,
 646						   mad_recv_wc);
 647		deref_snoop_agent(mad_snoop_priv);
 648		spin_lock_irqsave(&qp_info->snoop_lock, flags);
 649	}
 650	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 651}
 652
 653static void build_smp_wc(struct ib_qp *qp,
 654			 u64 wr_id, u16 slid, u16 pkey_index, u8 port_num,
 655			 struct ib_wc *wc)
 656{
 657	memset(wc, 0, sizeof *wc);
 658	wc->wr_id = wr_id;
 659	wc->status = IB_WC_SUCCESS;
 660	wc->opcode = IB_WC_RECV;
 661	wc->pkey_index = pkey_index;
 662	wc->byte_len = sizeof(struct ib_mad) + sizeof(struct ib_grh);
 663	wc->src_qp = IB_QP0;
 664	wc->qp = qp;
 665	wc->slid = slid;
 666	wc->sl = 0;
 667	wc->dlid_path_bits = 0;
 668	wc->port_num = port_num;
 669}
 670
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 671/*
 672 * Return 0 if SMP is to be sent
 673 * Return 1 if SMP was consumed locally (whether or not solicited)
 674 * Return < 0 if error
 675 */
 676static int handle_outgoing_dr_smp(struct ib_mad_agent_private *mad_agent_priv,
 677				  struct ib_mad_send_wr_private *mad_send_wr)
 678{
 679	int ret = 0;
 680	struct ib_smp *smp = mad_send_wr->send_buf.mad;
 
 681	unsigned long flags;
 682	struct ib_mad_local_private *local;
 683	struct ib_mad_private *mad_priv;
 684	struct ib_mad_port_private *port_priv;
 685	struct ib_mad_agent_private *recv_mad_agent = NULL;
 686	struct ib_device *device = mad_agent_priv->agent.device;
 687	u8 port_num;
 688	struct ib_wc mad_wc;
 689	struct ib_send_wr *send_wr = &mad_send_wr->send_wr;
 
 
 
 
 
 690
 691	if (device->node_type == RDMA_NODE_IB_SWITCH &&
 692	    smp->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
 693		port_num = send_wr->wr.ud.port_num;
 694	else
 695		port_num = mad_agent_priv->agent.port_num;
 696
 697	/*
 698	 * Directed route handling starts if the initial LID routed part of
 699	 * a request or the ending LID routed part of a response is empty.
 700	 * If we are at the start of the LID routed part, don't update the
 701	 * hop_ptr or hop_cnt.  See section 14.2.2, Vol 1 IB spec.
 702	 */
 703	if ((ib_get_smp_direction(smp) ? smp->dr_dlid : smp->dr_slid) ==
 704	     IB_LID_PERMISSIVE &&
 705	     smi_handle_dr_smp_send(smp, device->node_type, port_num) ==
 706	     IB_SMI_DISCARD) {
 707		ret = -EINVAL;
 708		printk(KERN_ERR PFX "Invalid directed route\n");
 709		goto out;
 710	}
 711
 712	/* Check to post send on QP or process locally */
 713	if (smi_check_local_smp(smp, device) == IB_SMI_DISCARD &&
 714	    smi_check_local_returning_smp(smp, device) == IB_SMI_DISCARD)
 715		goto out;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 716
 717	local = kmalloc(sizeof *local, GFP_ATOMIC);
 718	if (!local) {
 719		ret = -ENOMEM;
 720		printk(KERN_ERR PFX "No memory for ib_mad_local_private\n");
 721		goto out;
 722	}
 723	local->mad_priv = NULL;
 724	local->recv_mad_agent = NULL;
 725	mad_priv = kmem_cache_alloc(ib_mad_cache, GFP_ATOMIC);
 726	if (!mad_priv) {
 727		ret = -ENOMEM;
 728		printk(KERN_ERR PFX "No memory for local response MAD\n");
 729		kfree(local);
 730		goto out;
 731	}
 732
 733	build_smp_wc(mad_agent_priv->agent.qp,
 734		     send_wr->wr_id, be16_to_cpu(smp->dr_slid),
 735		     send_wr->wr.ud.pkey_index,
 736		     send_wr->wr.ud.port_num, &mad_wc);
 
 
 
 
 
 
 737
 738	/* No GRH for DR SMP */
 739	ret = device->process_mad(device, 0, port_num, &mad_wc, NULL,
 740				  (struct ib_mad *)smp,
 741				  (struct ib_mad *)&mad_priv->mad);
 
 742	switch (ret)
 743	{
 744	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_REPLY:
 745		if (ib_response_mad(&mad_priv->mad.mad) &&
 746		    mad_agent_priv->agent.recv_handler) {
 747			local->mad_priv = mad_priv;
 748			local->recv_mad_agent = mad_agent_priv;
 749			/*
 750			 * Reference MAD agent until receive
 751			 * side of local completion handled
 752			 */
 753			atomic_inc(&mad_agent_priv->refcount);
 754		} else
 755			kmem_cache_free(ib_mad_cache, mad_priv);
 756		break;
 757	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_CONSUMED:
 758		kmem_cache_free(ib_mad_cache, mad_priv);
 759		break;
 760	case IB_MAD_RESULT_SUCCESS:
 761		/* Treat like an incoming receive MAD */
 762		port_priv = ib_get_mad_port(mad_agent_priv->agent.device,
 763					    mad_agent_priv->agent.port_num);
 764		if (port_priv) {
 765			memcpy(&mad_priv->mad.mad, smp, sizeof(struct ib_mad));
 766			recv_mad_agent = find_mad_agent(port_priv,
 767						        &mad_priv->mad.mad);
 768		}
 769		if (!port_priv || !recv_mad_agent) {
 770			/*
 771			 * No receiving agent so drop packet and
 772			 * generate send completion.
 773			 */
 774			kmem_cache_free(ib_mad_cache, mad_priv);
 775			break;
 776		}
 777		local->mad_priv = mad_priv;
 778		local->recv_mad_agent = recv_mad_agent;
 779		break;
 780	default:
 781		kmem_cache_free(ib_mad_cache, mad_priv);
 782		kfree(local);
 783		ret = -EINVAL;
 784		goto out;
 785	}
 786
 787	local->mad_send_wr = mad_send_wr;
 
 
 
 
 788	/* Reference MAD agent until send side of local completion handled */
 789	atomic_inc(&mad_agent_priv->refcount);
 790	/* Queue local completion to local list */
 791	spin_lock_irqsave(&mad_agent_priv->lock, flags);
 792	list_add_tail(&local->completion_list, &mad_agent_priv->local_list);
 793	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
 794	queue_work(mad_agent_priv->qp_info->port_priv->wq,
 795		   &mad_agent_priv->local_work);
 796	ret = 1;
 797out:
 798	return ret;
 799}
 800
 801static int get_pad_size(int hdr_len, int data_len)
 802{
 803	int seg_size, pad;
 804
 805	seg_size = sizeof(struct ib_mad) - hdr_len;
 806	if (data_len && seg_size) {
 807		pad = seg_size - data_len % seg_size;
 808		return pad == seg_size ? 0 : pad;
 809	} else
 810		return seg_size;
 811}
 812
 813static void free_send_rmpp_list(struct ib_mad_send_wr_private *mad_send_wr)
 814{
 815	struct ib_rmpp_segment *s, *t;
 816
 817	list_for_each_entry_safe(s, t, &mad_send_wr->rmpp_list, list) {
 818		list_del(&s->list);
 819		kfree(s);
 820	}
 821}
 822
 823static int alloc_send_rmpp_list(struct ib_mad_send_wr_private *send_wr,
 824				gfp_t gfp_mask)
 825{
 826	struct ib_mad_send_buf *send_buf = &send_wr->send_buf;
 827	struct ib_rmpp_mad *rmpp_mad = send_buf->mad;
 828	struct ib_rmpp_segment *seg = NULL;
 829	int left, seg_size, pad;
 830
 831	send_buf->seg_size = sizeof (struct ib_mad) - send_buf->hdr_len;
 
 832	seg_size = send_buf->seg_size;
 833	pad = send_wr->pad;
 834
 835	/* Allocate data segments. */
 836	for (left = send_buf->data_len + pad; left > 0; left -= seg_size) {
 837		seg = kmalloc(sizeof (*seg) + seg_size, gfp_mask);
 838		if (!seg) {
 839			printk(KERN_ERR "alloc_send_rmpp_segs: RMPP mem "
 840			       "alloc failed for len %zd, gfp %#x\n",
 841			       sizeof (*seg) + seg_size, gfp_mask);
 842			free_send_rmpp_list(send_wr);
 843			return -ENOMEM;
 844		}
 845		seg->num = ++send_buf->seg_count;
 846		list_add_tail(&seg->list, &send_wr->rmpp_list);
 847	}
 848
 849	/* Zero any padding */
 850	if (pad)
 851		memset(seg->data + seg_size - pad, 0, pad);
 852
 853	rmpp_mad->rmpp_hdr.rmpp_version = send_wr->mad_agent_priv->
 854					  agent.rmpp_version;
 855	rmpp_mad->rmpp_hdr.rmpp_type = IB_MGMT_RMPP_TYPE_DATA;
 856	ib_set_rmpp_flags(&rmpp_mad->rmpp_hdr, IB_MGMT_RMPP_FLAG_ACTIVE);
 857
 858	send_wr->cur_seg = container_of(send_wr->rmpp_list.next,
 859					struct ib_rmpp_segment, list);
 860	send_wr->last_ack_seg = send_wr->cur_seg;
 861	return 0;
 862}
 863
 
 
 
 
 
 
 864struct ib_mad_send_buf * ib_create_send_mad(struct ib_mad_agent *mad_agent,
 865					    u32 remote_qpn, u16 pkey_index,
 866					    int rmpp_active,
 867					    int hdr_len, int data_len,
 868					    gfp_t gfp_mask)
 
 869{
 870	struct ib_mad_agent_private *mad_agent_priv;
 871	struct ib_mad_send_wr_private *mad_send_wr;
 872	int pad, message_size, ret, size;
 873	void *buf;
 
 
 874
 875	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
 876				      agent);
 877	pad = get_pad_size(hdr_len, data_len);
 
 
 
 
 
 
 
 
 878	message_size = hdr_len + data_len + pad;
 879
 880	if ((!mad_agent->rmpp_version &&
 881	     (rmpp_active || message_size > sizeof(struct ib_mad))) ||
 882	    (!rmpp_active && message_size > sizeof(struct ib_mad)))
 883		return ERR_PTR(-EINVAL);
 
 
 884
 885	size = rmpp_active ? hdr_len : sizeof(struct ib_mad);
 886	buf = kzalloc(sizeof *mad_send_wr + size, gfp_mask);
 887	if (!buf)
 888		return ERR_PTR(-ENOMEM);
 889
 890	mad_send_wr = buf + size;
 891	INIT_LIST_HEAD(&mad_send_wr->rmpp_list);
 892	mad_send_wr->send_buf.mad = buf;
 893	mad_send_wr->send_buf.hdr_len = hdr_len;
 894	mad_send_wr->send_buf.data_len = data_len;
 895	mad_send_wr->pad = pad;
 896
 897	mad_send_wr->mad_agent_priv = mad_agent_priv;
 898	mad_send_wr->sg_list[0].length = hdr_len;
 899	mad_send_wr->sg_list[0].lkey = mad_agent->mr->lkey;
 900	mad_send_wr->sg_list[1].length = sizeof(struct ib_mad) - hdr_len;
 901	mad_send_wr->sg_list[1].lkey = mad_agent->mr->lkey;
 902
 903	mad_send_wr->send_wr.wr_id = (unsigned long) mad_send_wr;
 904	mad_send_wr->send_wr.sg_list = mad_send_wr->sg_list;
 905	mad_send_wr->send_wr.num_sge = 2;
 906	mad_send_wr->send_wr.opcode = IB_WR_SEND;
 907	mad_send_wr->send_wr.send_flags = IB_SEND_SIGNALED;
 908	mad_send_wr->send_wr.wr.ud.remote_qpn = remote_qpn;
 909	mad_send_wr->send_wr.wr.ud.remote_qkey = IB_QP_SET_QKEY;
 910	mad_send_wr->send_wr.wr.ud.pkey_index = pkey_index;
 
 
 
 
 
 
 
 
 
 911
 912	if (rmpp_active) {
 913		ret = alloc_send_rmpp_list(mad_send_wr, gfp_mask);
 914		if (ret) {
 915			kfree(buf);
 916			return ERR_PTR(ret);
 917		}
 918	}
 919
 920	mad_send_wr->send_buf.mad_agent = mad_agent;
 921	atomic_inc(&mad_agent_priv->refcount);
 922	return &mad_send_wr->send_buf;
 923}
 924EXPORT_SYMBOL(ib_create_send_mad);
 925
 926int ib_get_mad_data_offset(u8 mgmt_class)
 927{
 928	if (mgmt_class == IB_MGMT_CLASS_SUBN_ADM)
 929		return IB_MGMT_SA_HDR;
 930	else if ((mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
 931		 (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
 932		 (mgmt_class == IB_MGMT_CLASS_BIS))
 933		return IB_MGMT_DEVICE_HDR;
 934	else if ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
 935		 (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END))
 936		return IB_MGMT_VENDOR_HDR;
 937	else
 938		return IB_MGMT_MAD_HDR;
 939}
 940EXPORT_SYMBOL(ib_get_mad_data_offset);
 941
 942int ib_is_mad_class_rmpp(u8 mgmt_class)
 943{
 944	if ((mgmt_class == IB_MGMT_CLASS_SUBN_ADM) ||
 945	    (mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
 946	    (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
 947	    (mgmt_class == IB_MGMT_CLASS_BIS) ||
 948	    ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
 949	     (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END)))
 950		return 1;
 951	return 0;
 952}
 953EXPORT_SYMBOL(ib_is_mad_class_rmpp);
 954
/*
 * ib_get_rmpp_segment - Return the data area of a given RMPP segment
 * @send_buf: send buffer embedded in a struct ib_mad_send_wr_private
 * @seg_num: number of the segment to locate
 *
 * The send work request caches a "current segment" cursor (cur_seg).  The
 * search starts from that cursor and walks the segment list forwards when
 * the cursor's number is below @seg_num, backwards when it is above, and
 * not at all when it already matches.  The cursor itself is used as the
 * iteration variable, so it is left pointing at the segment that was found.
 *
 * NOTE(review): if no segment carries @seg_num the loop runs to completion
 * and cur_seg no longer refers to a real segment; callers presumably
 * guarantee that @seg_num exists - confirm.
 *
 * Returns the ->data pointer of the segment the cursor ends up on.
 */
void *ib_get_rmpp_segment(struct ib_mad_send_buf *send_buf, int seg_num)
{
	struct ib_mad_send_wr_private *mad_send_wr;
	struct list_head *list;

	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
				   send_buf);
	/* Iteration is anchored at the cursor's own list node */
	list = &mad_send_wr->cur_seg->list;

	if (mad_send_wr->cur_seg->num < seg_num) {
		/* Target lies after the cursor: walk forwards */
		list_for_each_entry(mad_send_wr->cur_seg, list, list)
			if (mad_send_wr->cur_seg->num == seg_num)
				break;
	} else if (mad_send_wr->cur_seg->num > seg_num) {
		/* Target lies before the cursor: walk backwards */
		list_for_each_entry_reverse(mad_send_wr->cur_seg, list, list)
			if (mad_send_wr->cur_seg->num == seg_num)
				break;
	}
	return mad_send_wr->cur_seg->data;
}
EXPORT_SYMBOL(ib_get_rmpp_segment);
 976
 977static inline void *ib_get_payload(struct ib_mad_send_wr_private *mad_send_wr)
 978{
 979	if (mad_send_wr->send_buf.seg_count)
 980		return ib_get_rmpp_segment(&mad_send_wr->send_buf,
 981					   mad_send_wr->seg_num);
 982	else
 983		return mad_send_wr->send_buf.mad +
 984		       mad_send_wr->send_buf.hdr_len;
 985}
 986
 987void ib_free_send_mad(struct ib_mad_send_buf *send_buf)
 988{
 989	struct ib_mad_agent_private *mad_agent_priv;
 990	struct ib_mad_send_wr_private *mad_send_wr;
 991
 992	mad_agent_priv = container_of(send_buf->mad_agent,
 993				      struct ib_mad_agent_private, agent);
 994	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
 995				   send_buf);
 996
 997	free_send_rmpp_list(mad_send_wr);
 998	kfree(send_buf->mad);
 999	deref_mad_agent(mad_agent_priv);
1000}
1001EXPORT_SYMBOL(ib_free_send_mad);
1002
1003int ib_send_mad(struct ib_mad_send_wr_private *mad_send_wr)
1004{
1005	struct ib_mad_qp_info *qp_info;
1006	struct list_head *list;
1007	struct ib_send_wr *bad_send_wr;
1008	struct ib_mad_agent *mad_agent;
1009	struct ib_sge *sge;
1010	unsigned long flags;
1011	int ret;
1012
1013	/* Set WR ID to find mad_send_wr upon completion */
1014	qp_info = mad_send_wr->mad_agent_priv->qp_info;
1015	mad_send_wr->send_wr.wr_id = (unsigned long)&mad_send_wr->mad_list;
1016	mad_send_wr->mad_list.mad_queue = &qp_info->send_queue;
 
 
1017
1018	mad_agent = mad_send_wr->send_buf.mad_agent;
1019	sge = mad_send_wr->sg_list;
1020	sge[0].addr = ib_dma_map_single(mad_agent->device,
1021					mad_send_wr->send_buf.mad,
1022					sge[0].length,
1023					DMA_TO_DEVICE);
 
 
 
1024	mad_send_wr->header_mapping = sge[0].addr;
1025
1026	sge[1].addr = ib_dma_map_single(mad_agent->device,
1027					ib_get_payload(mad_send_wr),
1028					sge[1].length,
1029					DMA_TO_DEVICE);
 
 
 
 
 
 
1030	mad_send_wr->payload_mapping = sge[1].addr;
1031
1032	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
1033	if (qp_info->send_queue.count < qp_info->send_queue.max_active) {
1034		ret = ib_post_send(mad_agent->qp, &mad_send_wr->send_wr,
1035				   &bad_send_wr);
1036		list = &qp_info->send_queue.list;
1037	} else {
1038		ret = 0;
1039		list = &qp_info->overflow_list;
1040	}
1041
1042	if (!ret) {
1043		qp_info->send_queue.count++;
1044		list_add_tail(&mad_send_wr->mad_list.list, list);
1045	}
1046	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
1047	if (ret) {
1048		ib_dma_unmap_single(mad_agent->device,
1049				    mad_send_wr->header_mapping,
1050				    sge[0].length, DMA_TO_DEVICE);
1051		ib_dma_unmap_single(mad_agent->device,
1052				    mad_send_wr->payload_mapping,
1053				    sge[1].length, DMA_TO_DEVICE);
1054	}
1055	return ret;
1056}
1057
/*
 * ib_post_send_mad - Posts MAD(s) to the send queue of the QP associated
 *  with the registered client
 * @send_buf: head of a ->next linked chain of send buffers to post
 * @bad_send_buf: if non-NULL, receives the buffer that failed on error
 *
 * Each buffer in the chain is validated, linked onto the agent's send_list
 * and handed either to the RMPP layer or directly to ib_send_mad().
 * Processing stops at the first failure; buffers before it stay posted.
 *
 * Returns 0 when every buffer was posted or consumed locally (including
 * when @send_buf is NULL), otherwise a negative error code.
 */
int ib_post_send_mad(struct ib_mad_send_buf *send_buf,
		     struct ib_mad_send_buf **bad_send_buf)
{
	struct ib_mad_agent_private *mad_agent_priv;
	struct ib_mad_send_buf *next_send_buf;
	struct ib_mad_send_wr_private *mad_send_wr;
	unsigned long flags;
	int ret = -EINVAL;

	/* Walk list of send WRs and post each on send list */
	for (; send_buf; send_buf = next_send_buf) {

		mad_send_wr = container_of(send_buf,
					   struct ib_mad_send_wr_private,
					   send_buf);
		mad_agent_priv = mad_send_wr->mad_agent_priv;

		/*
		 * A send handler is mandatory; a receive handler is also
		 * required when a timeout is set.
		 */
		if (!send_buf->mad_agent->send_handler ||
		    (send_buf->timeout_ms &&
		     !send_buf->mad_agent->recv_handler)) {
			ret = -EINVAL;
			goto error;
		}

		/* An RMPP agent may only send MADs of an RMPP class */
		if (!ib_is_mad_class_rmpp(((struct ib_mad_hdr *) send_buf->mad)->mgmt_class)) {
			if (mad_agent_priv->agent.rmpp_version) {
				ret = -EINVAL;
				goto error;
			}
		}

		/*
		 * Save pointer to next work request to post in case the
		 * current one completes, and the user modifies the work
		 * request associated with the completion
		 */
		next_send_buf = send_buf->next;
		mad_send_wr->send_wr.wr.ud.ah = send_buf->ah;

		if (((struct ib_mad_hdr *) send_buf->mad)->mgmt_class ==
		    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
			ret = handle_outgoing_dr_smp(mad_agent_priv,
						     mad_send_wr);
			if (ret < 0)		/* error */
				goto error;
			else if (ret == 1)	/* locally consumed */
				continue;
		}

		mad_send_wr->tid = ((struct ib_mad_hdr *) send_buf->mad)->tid;
		/* Timeout will be updated after send completes */
		mad_send_wr->timeout = msecs_to_jiffies(send_buf->timeout_ms);
		mad_send_wr->max_retries = send_buf->retries;
		mad_send_wr->retries_left = send_buf->retries;
		/* Retry count now lives in mad_send_wr; clear the caller's copy */
		send_buf->retries = 0;
		/* Reference for work request to QP + response */
		mad_send_wr->refcount = 1 + (mad_send_wr->timeout > 0);
		mad_send_wr->status = IB_WC_SUCCESS;

		/* Reference MAD agent until send completes */
		atomic_inc(&mad_agent_priv->refcount);
		spin_lock_irqsave(&mad_agent_priv->lock, flags);
		list_add_tail(&mad_send_wr->agent_list,
			      &mad_agent_priv->send_list);
		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);

		if (mad_agent_priv->agent.rmpp_version) {
			/* RMPP layer may consume the MAD itself */
			ret = ib_send_rmpp_mad(mad_send_wr);
			if (ret >= 0 && ret != IB_RMPP_RESULT_CONSUMED)
				ret = ib_send_mad(mad_send_wr);
		} else
			ret = ib_send_mad(mad_send_wr);
		if (ret < 0) {
			/* Fail send request */
			spin_lock_irqsave(&mad_agent_priv->lock, flags);
			list_del(&mad_send_wr->agent_list);
			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
			atomic_dec(&mad_agent_priv->refcount);
			goto error;
		}
	}
	return 0;
error:
	/* Report which buffer in the chain could not be posted */
	if (bad_send_buf)
		*bad_send_buf = send_buf;
	return ret;
}
EXPORT_SYMBOL(ib_post_send_mad);
1150
1151/*
1152 * ib_free_recv_mad - Returns data buffers used to receive
1153 *  a MAD to the access layer
1154 */
1155void ib_free_recv_mad(struct ib_mad_recv_wc *mad_recv_wc)
1156{
1157	struct ib_mad_recv_buf *mad_recv_buf, *temp_recv_buf;
1158	struct ib_mad_private_header *mad_priv_hdr;
1159	struct ib_mad_private *priv;
1160	struct list_head free_list;
1161
1162	INIT_LIST_HEAD(&free_list);
1163	list_splice_init(&mad_recv_wc->rmpp_list, &free_list);
1164
1165	list_for_each_entry_safe(mad_recv_buf, temp_recv_buf,
1166					&free_list, list) {
1167		mad_recv_wc = container_of(mad_recv_buf, struct ib_mad_recv_wc,
1168					   recv_buf);
1169		mad_priv_hdr = container_of(mad_recv_wc,
1170					    struct ib_mad_private_header,
1171					    recv_wc);
1172		priv = container_of(mad_priv_hdr, struct ib_mad_private,
1173				    header);
1174		kmem_cache_free(ib_mad_cache, priv);
1175	}
1176}
1177EXPORT_SYMBOL(ib_free_recv_mad);
1178
/*
 * ib_redirect_mad_qp - Placeholder for QP redirection
 *
 * Not implemented: all arguments are ignored and ERR_PTR(-EINVAL) is
 * always returned.
 */
struct ib_mad_agent *ib_redirect_mad_qp(struct ib_qp *qp,
					u8 rmpp_version,
					ib_mad_send_handler send_handler,
					ib_mad_recv_handler recv_handler,
					void *context)
{
	return ERR_PTR(-EINVAL);	/* XXX: for now */
}
EXPORT_SYMBOL(ib_redirect_mad_qp);
1188
/*
 * ib_process_mad_wc - Placeholder for processing a work completion on
 * behalf of a MAD agent
 *
 * Not implemented: logs an error message, ignores both arguments and
 * returns 0.
 */
int ib_process_mad_wc(struct ib_mad_agent *mad_agent,
		      struct ib_wc *wc)
{
	printk(KERN_ERR PFX "ib_process_mad_wc() not implemented yet\n");
	return 0;
}
EXPORT_SYMBOL(ib_process_mad_wc);
1196
1197static int method_in_use(struct ib_mad_mgmt_method_table **method,
1198			 struct ib_mad_reg_req *mad_reg_req)
1199{
1200	int i;
1201
1202	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS) {
1203		if ((*method)->agent[i]) {
1204			printk(KERN_ERR PFX "Method %d already in use\n", i);
1205			return -EINVAL;
1206		}
1207	}
1208	return 0;
1209}
1210
1211static int allocate_method_table(struct ib_mad_mgmt_method_table **method)
1212{
1213	/* Allocate management method table */
1214	*method = kzalloc(sizeof **method, GFP_ATOMIC);
1215	if (!*method) {
1216		printk(KERN_ERR PFX "No memory for "
1217		       "ib_mad_mgmt_method_table\n");
1218		return -ENOMEM;
1219	}
1220
1221	return 0;
1222}
1223
1224/*
1225 * Check to see if there are any methods still in use
1226 */
1227static int check_method_table(struct ib_mad_mgmt_method_table *method)
1228{
1229	int i;
1230
1231	for (i = 0; i < IB_MGMT_MAX_METHODS; i++)
1232		if (method->agent[i])
1233			return 1;
1234	return 0;
1235}
1236
1237/*
1238 * Check to see if there are any method tables for this class still in use
1239 */
1240static int check_class_table(struct ib_mad_mgmt_class_table *class)
1241{
1242	int i;
1243
1244	for (i = 0; i < MAX_MGMT_CLASS; i++)
1245		if (class->method_table[i])
1246			return 1;
1247	return 0;
1248}
1249
1250static int check_vendor_class(struct ib_mad_mgmt_vendor_class *vendor_class)
1251{
1252	int i;
1253
1254	for (i = 0; i < MAX_MGMT_OUI; i++)
1255		if (vendor_class->method_table[i])
1256			return 1;
1257	return 0;
1258}
1259
1260static int find_vendor_oui(struct ib_mad_mgmt_vendor_class *vendor_class,
1261			   char *oui)
1262{
1263	int i;
1264
1265	for (i = 0; i < MAX_MGMT_OUI; i++)
1266		/* Is there matching OUI for this vendor class ? */
1267		if (!memcmp(vendor_class->oui[i], oui, 3))
1268			return i;
1269
1270	return -1;
1271}
1272
1273static int check_vendor_table(struct ib_mad_mgmt_vendor_class_table *vendor)
1274{
1275	int i;
1276
1277	for (i = 0; i < MAX_MGMT_VENDOR_RANGE2; i++)
1278		if (vendor->vendor_class[i])
1279			return 1;
1280
1281	return 0;
1282}
1283
1284static void remove_methods_mad_agent(struct ib_mad_mgmt_method_table *method,
1285				     struct ib_mad_agent_private *agent)
1286{
1287	int i;
1288
1289	/* Remove any methods for this mad agent */
1290	for (i = 0; i < IB_MGMT_MAX_METHODS; i++) {
1291		if (method->agent[i] == agent) {
1292			method->agent[i] = NULL;
1293		}
1294	}
1295}
1296
/*
 * add_nonoui_reg_req - Register an agent for the methods of a class that
 * is not routed by OUI
 * @mad_reg_req: registration request (class version and method mask)
 * @agent_priv: agent to install in the method table
 * @mgmt_class: index into the class table's method_table array
 *
 * Allocates the per-version class table and the per-class method table on
 * demand, verifies that none of the requested methods is already claimed,
 * then points each requested method slot at @agent_priv.
 *
 * Returns 0 on success, -ENOMEM if an allocation fails, or -EINVAL if a
 * requested method is already in use.
 */
static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
			      struct ib_mad_agent_private *agent_priv,
			      u8 mgmt_class)
{
	struct ib_mad_port_private *port_priv;
	struct ib_mad_mgmt_class_table **class;
	struct ib_mad_mgmt_method_table **method;
	int i, ret;

	port_priv = agent_priv->qp_info->port_priv;
	class = &port_priv->version[mad_reg_req->mgmt_class_version].class;
	if (!*class) {
		/* Allocate management class table for "new" class version */
		*class = kzalloc(sizeof **class, GFP_ATOMIC);
		if (!*class) {
			printk(KERN_ERR PFX "No memory for "
			       "ib_mad_mgmt_class_table\n");
			ret = -ENOMEM;
			goto error1;
		}

		/* Allocate method table for this management class */
		method = &(*class)->method_table[mgmt_class];
		if ((ret = allocate_method_table(method)))
			goto error2;
	} else {
		method = &(*class)->method_table[mgmt_class];
		if (!*method) {
			/* Allocate method table for this management class */
			if ((ret = allocate_method_table(method)))
				goto error1;
		}
	}

	/* Now, make sure methods are not already in use */
	if (method_in_use(method, mad_reg_req))
		goto error3;

	/* Finally, add in methods being registered */
	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
		(*method)->agent[i] = agent_priv;

	return 0;

error3:
	/* Remove any methods for this mad agent */
	remove_methods_mad_agent(*method, agent_priv);
	/* Now, check to see if there are any methods in use */
	if (!check_method_table(*method)) {
		/* If not, release management method table */
		kfree(*method);
		*method = NULL;
	}
	ret = -EINVAL;
	goto error1;
error2:
	/* Only reached when the class table was allocated by this call */
	kfree(*class);
	*class = NULL;
error1:
	return ret;
}
1358
/*
 * add_oui_reg_req - Register an agent for the methods of a vendor class
 * that is routed by OUI
 * @mad_reg_req: registration request (class, class version, OUI, methods)
 * @agent_priv: agent to install in the method table
 *
 * Allocates the per-version vendor table and the vendor class entry on
 * demand, then either reuses the slot whose OUI matches the request or
 * claims the first free OUI slot and allocates its method table.  Once a
 * slot is chosen the requested methods are checked for conflicts and then
 * assigned to @agent_priv.
 *
 * Returns 0 on success, -EINVAL if a requested method is already in use,
 * or -ENOMEM if an allocation fails or every OUI slot is occupied.  Tables
 * allocated by this call are released again on failure.
 */
static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
			   struct ib_mad_agent_private *agent_priv)
{
	struct ib_mad_port_private *port_priv;
	struct ib_mad_mgmt_vendor_class_table **vendor_table;
	/* Non-NULL only when allocated here; tells the unwind what to free */
	struct ib_mad_mgmt_vendor_class_table *vendor = NULL;
	struct ib_mad_mgmt_vendor_class *vendor_class = NULL;
	struct ib_mad_mgmt_method_table **method;
	int i, ret = -ENOMEM;
	u8 vclass;

	/* "New" vendor (with OUI) class */
	vclass = vendor_class_index(mad_reg_req->mgmt_class);
	port_priv = agent_priv->qp_info->port_priv;
	vendor_table = &port_priv->version[
				mad_reg_req->mgmt_class_version].vendor;
	if (!*vendor_table) {
		/* Allocate mgmt vendor class table for "new" class version */
		vendor = kzalloc(sizeof *vendor, GFP_ATOMIC);
		if (!vendor) {
			printk(KERN_ERR PFX "No memory for "
			       "ib_mad_mgmt_vendor_class_table\n");
			goto error1;
		}

		*vendor_table = vendor;
	}
	if (!(*vendor_table)->vendor_class[vclass]) {
		/* Allocate table for this management vendor class */
		vendor_class = kzalloc(sizeof *vendor_class, GFP_ATOMIC);
		if (!vendor_class) {
			printk(KERN_ERR PFX "No memory for "
			       "ib_mad_mgmt_vendor_class\n");
			goto error2;
		}

		(*vendor_table)->vendor_class[vclass] = vendor_class;
	}
	/* First pass: look for a slot already holding this OUI */
	for (i = 0; i < MAX_MGMT_OUI; i++) {
		/* Is there matching OUI for this vendor class ? */
		if (!memcmp((*vendor_table)->vendor_class[vclass]->oui[i],
			    mad_reg_req->oui, 3)) {
			method = &(*vendor_table)->vendor_class[
						vclass]->method_table[i];
			BUG_ON(!*method);
			goto check_in_use;
		}
	}
	/* Second pass: claim the first unused OUI slot */
	for (i = 0; i < MAX_MGMT_OUI; i++) {
		/* OUI slot available ? */
		if (!is_vendor_oui((*vendor_table)->vendor_class[
				vclass]->oui[i])) {
			method = &(*vendor_table)->vendor_class[
				vclass]->method_table[i];
			BUG_ON(*method);
			/* Allocate method table for this OUI */
			if ((ret = allocate_method_table(method)))
				goto error3;
			memcpy((*vendor_table)->vendor_class[vclass]->oui[i],
			       mad_reg_req->oui, 3);
			goto check_in_use;
		}
	}
	/* ret still holds its initial -ENOMEM here */
	printk(KERN_ERR PFX "All OUI slots in use\n");
	goto error3;

check_in_use:
	/* Now, make sure methods are not already in use */
	if (method_in_use(method, mad_reg_req))
		goto error4;

	/* Finally, add in methods being registered */
	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
		(*method)->agent[i] = agent_priv;

	return 0;

error4:
	/* Remove any methods for this mad agent */
	remove_methods_mad_agent(*method, agent_priv);
	/* Now, check to see if there are any methods in use */
	if (!check_method_table(*method)) {
		/* If not, release management method table */
		kfree(*method);
		*method = NULL;
	}
	ret = -EINVAL;
error3:
	if (vendor_class) {
		(*vendor_table)->vendor_class[vclass] = NULL;
		kfree(vendor_class);
	}
error2:
	if (vendor) {
		*vendor_table = NULL;
		kfree(vendor);
	}
error1:
	return ret;
}
1459
/*
 * remove_mad_reg_req - Undo the method registrations of an agent
 * @agent_priv: agent whose registration request is being removed
 *
 * Does nothing if the agent has no registration request.  Otherwise the
 * agent is cleared from the method table of its class, and then, for
 * vendor classes, from the method table of its OUI slot.  Each table that
 * becomes empty as a result is freed and its parent slot reset to NULL,
 * cascading upwards (method table, class / vendor class, vendor table).
 */
static void remove_mad_reg_req(struct ib_mad_agent_private *agent_priv)
{
	struct ib_mad_port_private *port_priv;
	struct ib_mad_mgmt_class_table *class;
	struct ib_mad_mgmt_method_table *method;
	struct ib_mad_mgmt_vendor_class_table *vendor;
	struct ib_mad_mgmt_vendor_class *vendor_class;
	int index;
	u8 mgmt_class;

	/*
	 * Was MAD registration request supplied
	 * with original registration ?
	 */
	if (!agent_priv->reg_req) {
		goto out;
	}

	port_priv = agent_priv->qp_info->port_priv;
	mgmt_class = convert_mgmt_class(agent_priv->reg_req->mgmt_class);
	class = port_priv->version[
			agent_priv->reg_req->mgmt_class_version].class;
	if (!class)
		goto vendor_check;

	method = class->method_table[mgmt_class];
	if (method) {
		/* Remove any methods for this mad agent */
		remove_methods_mad_agent(method, agent_priv);
		/* Now, check to see if there are any methods still in use */
		if (!check_method_table(method)) {
			/* If not, release management method table */
			 kfree(method);
			 class->method_table[mgmt_class] = NULL;
			 /* Any management classes left ? */
			if (!check_class_table(class)) {
				/* If not, release management class table */
				kfree(class);
				port_priv->version[
					agent_priv->reg_req->
					mgmt_class_version].class = NULL;
			}
		}
	}

vendor_check:
	if (!is_vendor_class(mgmt_class))
		goto out;

	/* normalize mgmt_class to vendor range 2 */
	mgmt_class = vendor_class_index(agent_priv->reg_req->mgmt_class);
	vendor = port_priv->version[
			agent_priv->reg_req->mgmt_class_version].vendor;

	if (!vendor)
		goto out;

	vendor_class = vendor->vendor_class[mgmt_class];
	if (vendor_class) {
		index = find_vendor_oui(vendor_class, agent_priv->reg_req->oui);
		if (index < 0)
			goto out;
		method = vendor_class->method_table[index];
		if (method) {
			/* Remove any methods for this mad agent */
			remove_methods_mad_agent(method, agent_priv);
			/*
			 * Now, check to see if there are
			 * any methods still in use
			 */
			if (!check_method_table(method)) {
				/* If not, release management method table */
				kfree(method);
				vendor_class->method_table[index] = NULL;
				/* Zero the OUI so the slot reads as free */
				memset(vendor_class->oui[index], 0, 3);
				/* Any OUIs left ? */
				if (!check_vendor_class(vendor_class)) {
					/* If not, release vendor class table */
					kfree(vendor_class);
					vendor->vendor_class[mgmt_class] = NULL;
					/* Any other vendor classes left ? */
					if (!check_vendor_table(vendor)) {
						kfree(vendor);
						port_priv->version[
							agent_priv->reg_req->
							mgmt_class_version].
							vendor = NULL;
					}
				}
			}
		}
	}

out:
	return;
}
1556
1557static struct ib_mad_agent_private *
1558find_mad_agent(struct ib_mad_port_private *port_priv,
1559	       struct ib_mad *mad)
1560{
1561	struct ib_mad_agent_private *mad_agent = NULL;
1562	unsigned long flags;
1563
1564	spin_lock_irqsave(&port_priv->reg_lock, flags);
1565	if (ib_response_mad(mad)) {
1566		u32 hi_tid;
1567		struct ib_mad_agent_private *entry;
1568
1569		/*
1570		 * Routing is based on high 32 bits of transaction ID
1571		 * of MAD.
1572		 */
1573		hi_tid = be64_to_cpu(mad->mad_hdr.tid) >> 32;
1574		list_for_each_entry(entry, &port_priv->agent_list, agent_list) {
1575			if (entry->agent.hi_tid == hi_tid) {
1576				mad_agent = entry;
1577				break;
1578			}
1579		}
1580	} else {
1581		struct ib_mad_mgmt_class_table *class;
1582		struct ib_mad_mgmt_method_table *method;
1583		struct ib_mad_mgmt_vendor_class_table *vendor;
1584		struct ib_mad_mgmt_vendor_class *vendor_class;
1585		struct ib_vendor_mad *vendor_mad;
1586		int index;
1587
1588		/*
1589		 * Routing is based on version, class, and method
1590		 * For "newer" vendor MADs, also based on OUI
1591		 */
1592		if (mad->mad_hdr.class_version >= MAX_MGMT_VERSION)
1593			goto out;
1594		if (!is_vendor_class(mad->mad_hdr.mgmt_class)) {
1595			class = port_priv->version[
1596					mad->mad_hdr.class_version].class;
1597			if (!class)
1598				goto out;
 
 
 
1599			method = class->method_table[convert_mgmt_class(
1600							mad->mad_hdr.mgmt_class)];
1601			if (method)
1602				mad_agent = method->agent[mad->mad_hdr.method &
1603							  ~IB_MGMT_METHOD_RESP];
1604		} else {
1605			vendor = port_priv->version[
1606					mad->mad_hdr.class_version].vendor;
1607			if (!vendor)
1608				goto out;
1609			vendor_class = vendor->vendor_class[vendor_class_index(
1610						mad->mad_hdr.mgmt_class)];
1611			if (!vendor_class)
1612				goto out;
1613			/* Find matching OUI */
1614			vendor_mad = (struct ib_vendor_mad *)mad;
1615			index = find_vendor_oui(vendor_class, vendor_mad->oui);
1616			if (index == -1)
1617				goto out;
1618			method = vendor_class->method_table[index];
1619			if (method) {
1620				mad_agent = method->agent[mad->mad_hdr.method &
1621							  ~IB_MGMT_METHOD_RESP];
1622			}
1623		}
1624	}
1625
1626	if (mad_agent) {
1627		if (mad_agent->agent.recv_handler)
1628			atomic_inc(&mad_agent->refcount);
1629		else {
1630			printk(KERN_NOTICE PFX "No receive handler for client "
1631			       "%p on port %d\n",
1632			       &mad_agent->agent, port_priv->port_num);
1633			mad_agent = NULL;
1634		}
1635	}
1636out:
1637	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
1638
1639	return mad_agent;
1640}
1641
1642static int validate_mad(struct ib_mad *mad, u32 qp_num)
 
 
1643{
1644	int valid = 0;
 
1645
1646	/* Make sure MAD base version is understood */
1647	if (mad->mad_hdr.base_version != IB_MGMT_BASE_VERSION) {
1648		printk(KERN_ERR PFX "MAD received with unsupported base "
1649		       "version %d\n", mad->mad_hdr.base_version);
 
1650		goto out;
1651	}
1652
1653	/* Filter SMI packets sent to other than QP0 */
1654	if ((mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
1655	    (mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
1656		if (qp_num == 0)
1657			valid = 1;
1658	} else {
 
 
 
 
 
1659		/* Filter GSI packets sent to QP0 */
1660		if (qp_num != 0)
1661			valid = 1;
1662	}
1663
1664out:
1665	return valid;
1666}
1667
1668static int is_data_mad(struct ib_mad_agent_private *mad_agent_priv,
1669		       struct ib_mad_hdr *mad_hdr)
1670{
1671	struct ib_rmpp_mad *rmpp_mad;
1672
1673	rmpp_mad = (struct ib_rmpp_mad *)mad_hdr;
1674	return !mad_agent_priv->agent.rmpp_version ||
 
1675		!(ib_get_rmpp_flags(&rmpp_mad->rmpp_hdr) &
1676				    IB_MGMT_RMPP_FLAG_ACTIVE) ||
1677		(rmpp_mad->rmpp_hdr.rmpp_type == IB_MGMT_RMPP_TYPE_DATA);
1678}
1679
1680static inline int rcv_has_same_class(struct ib_mad_send_wr_private *wr,
1681				     struct ib_mad_recv_wc *rwc)
1682{
1683	return ((struct ib_mad *)(wr->send_buf.mad))->mad_hdr.mgmt_class ==
1684		rwc->recv_buf.mad->mad_hdr.mgmt_class;
1685}
1686
/*
 * rcv_has_same_gid - Check that a received MAD's addressing matches the
 * address used for a sent MAD
 * @mad_agent_priv: agent that owns the send
 * @wr: the send work request
 * @rwc: the receive work completion
 *
 * Returns 0 (no match) when both MADs are requests or both are responses,
 * when the send's address handle cannot be queried, when only one side has
 * a GRH, or when a cached LMC/GID lookup fails.
 *
 * When the send was a request and the receive is a response, the local
 * source of the send is compared with the destination of the receive:
 * source path bits against the receive's DLID path bits (masked by the
 * port LMC) without a GRH, or the cached source GID against the received
 * GRH's DGID with one.
 *
 * Otherwise (the send was the response) the remote destination of the send
 * is compared with the source of the receive: DLID against SLID without a
 * GRH, or the address handle's DGID against the received GRH's SGID.
 */
static inline int rcv_has_same_gid(struct ib_mad_agent_private *mad_agent_priv,
				   struct ib_mad_send_wr_private *wr,
				   struct ib_mad_recv_wc *rwc )
{
	struct ib_ah_attr attr;
	u8 send_resp, rcv_resp;
	union ib_gid sgid;
	struct ib_device *device = mad_agent_priv->agent.device;
	u8 port_num = mad_agent_priv->agent.port_num;
	u8 lmc;

	send_resp = ib_response_mad((struct ib_mad *)wr->send_buf.mad);
	rcv_resp = ib_response_mad(rwc->recv_buf.mad);

	if (send_resp == rcv_resp)
		/* both requests, or both responses. GIDs different */
		return 0;

	if (ib_query_ah(wr->send_buf.ah, &attr))
		/* Assume not equal, to avoid false positives. */
		return 0;

	if (!!(attr.ah_flags & IB_AH_GRH) !=
	    !!(rwc->wc->wc_flags & IB_WC_GRH))
		/* one has GID, other does not.  Assume different */
		return 0;

	if (!send_resp && rcv_resp) {
		/* is request/response. */
		if (!(attr.ah_flags & IB_AH_GRH)) {
			if (ib_get_cached_lmc(device, port_num, &lmc))
				return 0;
			/* With LMC 0 there are no path bits to compare */
			return (!lmc || !((attr.src_path_bits ^
					   rwc->wc->dlid_path_bits) &
					  ((1 << lmc) - 1)));
		} else {
			if (ib_get_cached_gid(device, port_num,
					      attr.grh.sgid_index, &sgid))
				return 0;
			return !memcmp(sgid.raw, rwc->recv_buf.grh->dgid.raw,
				       16);
		}
	}

	/* Send was the response: compare its destination with the sender */
	if (!(attr.ah_flags & IB_AH_GRH))
		return attr.dlid == rwc->wc->slid;
	else
		return !memcmp(attr.grh.dgid.raw, rwc->recv_buf.grh->sgid.raw,
			       16);
}
1737
1738static inline int is_direct(u8 class)
1739{
1740	return (class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE);
1741}
1742
1743struct ib_mad_send_wr_private*
1744ib_find_send_mad(struct ib_mad_agent_private *mad_agent_priv,
1745		 struct ib_mad_recv_wc *wc)
1746{
1747	struct ib_mad_send_wr_private *wr;
1748	struct ib_mad *mad;
1749
1750	mad = (struct ib_mad *)wc->recv_buf.mad;
1751
1752	list_for_each_entry(wr, &mad_agent_priv->wait_list, agent_list) {
1753		if ((wr->tid == mad->mad_hdr.tid) &&
1754		    rcv_has_same_class(wr, wc) &&
1755		    /*
1756		     * Don't check GID for direct routed MADs.
1757		     * These might have permissive LIDs.
1758		     */
1759		    (is_direct(wc->recv_buf.mad->mad_hdr.mgmt_class) ||
1760		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1761			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1762	}
1763
1764	/*
1765	 * It's possible to receive the response before we've
1766	 * been notified that the send has completed
1767	 */
1768	list_for_each_entry(wr, &mad_agent_priv->send_list, agent_list) {
1769		if (is_data_mad(mad_agent_priv, wr->send_buf.mad) &&
1770		    wr->tid == mad->mad_hdr.tid &&
1771		    wr->timeout &&
1772		    rcv_has_same_class(wr, wc) &&
1773		    /*
1774		     * Don't check GID for direct routed MADs.
1775		     * These might have permissive LIDs.
1776		     */
1777		    (is_direct(wc->recv_buf.mad->mad_hdr.mgmt_class) ||
1778		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1779			/* Verify request has not been canceled */
1780			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1781	}
1782	return NULL;
1783}
1784
1785void ib_mark_mad_done(struct ib_mad_send_wr_private *mad_send_wr)
1786{
1787	mad_send_wr->timeout = 0;
1788	if (mad_send_wr->refcount == 1)
1789		list_move_tail(&mad_send_wr->agent_list,
1790			      &mad_send_wr->mad_agent_priv->done_list);
1791}
1792
/*
 * ib_mad_complete_recv - Deliver a received MAD to its agent
 * @mad_agent_priv: agent selected for the MAD (a reference is held on entry)
 * @mad_recv_wc: receive work completion describing the MAD
 *
 * Puts the receive buffer on the completion's own rmpp_list and, for RMPP
 * agents, runs it through RMPP processing first; if that returns NULL the
 * agent reference is dropped and nothing is delivered.
 *
 * A response is matched to its outstanding send under the agent lock.  An
 * unmatched response is freed and the agent reference dropped.  A matched
 * response is passed to the receive handler first, and the corresponding
 * send is completed with IB_WC_SUCCESS afterwards.  A non-response MAD is
 * simply passed to the receive handler.
 */
static void ib_mad_complete_recv(struct ib_mad_agent_private *mad_agent_priv,
				 struct ib_mad_recv_wc *mad_recv_wc)
{
	struct ib_mad_send_wr_private *mad_send_wr;
	struct ib_mad_send_wc mad_send_wc;
	unsigned long flags;

	INIT_LIST_HEAD(&mad_recv_wc->rmpp_list);
	list_add(&mad_recv_wc->recv_buf.list, &mad_recv_wc->rmpp_list);
	if (mad_agent_priv->agent.rmpp_version) {
		mad_recv_wc = ib_process_rmpp_recv_wc(mad_agent_priv,
						      mad_recv_wc);
		/* NULL means the RMPP layer has nothing to deliver now */
		if (!mad_recv_wc) {
			deref_mad_agent(mad_agent_priv);
			return;
		}
	}

	/* Complete corresponding request */
	if (ib_response_mad(mad_recv_wc->recv_buf.mad)) {
		spin_lock_irqsave(&mad_agent_priv->lock, flags);
		mad_send_wr = ib_find_send_mad(mad_agent_priv, mad_recv_wc);
		if (!mad_send_wr) {
			/* No matching request: drop the response */
			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
			ib_free_recv_mad(mad_recv_wc);
			deref_mad_agent(mad_agent_priv);
			return;
		}
		ib_mark_mad_done(mad_send_wr);
		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);

		/* Defined behavior is to complete response before request */
		mad_recv_wc->wc->wr_id = (unsigned long) &mad_send_wr->send_buf;
		mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent,
						   mad_recv_wc);
		/*
		 * NOTE(review): plain atomic_dec rather than
		 * deref_mad_agent(); presumably safe because the pending
		 * send still holds an agent reference - confirm.
		 */
		atomic_dec(&mad_agent_priv->refcount);

		mad_send_wc.status = IB_WC_SUCCESS;
		mad_send_wc.vendor_err = 0;
		mad_send_wc.send_buf = &mad_send_wr->send_buf;
		ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
	} else {
		mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent,
						   mad_recv_wc);
		deref_mad_agent(mad_agent_priv);
	}
}
1840
/*
 * ib_mad_recv_done_handler - Process one receive work completion
 * @port_priv: port the completion belongs to
 * @wc: the work completion; wr_id holds a pointer to the MAD list head
 *
 * Recovers the receive buffer from the completion, unmaps it, fills in the
 * MAD receive completion, and then:
 *  - offers the MAD to receive snoopers,
 *  - drops it if validate_mad() rejects it,
 *  - applies directed-route SMP handling (discard, handle locally, or, on
 *    a switch, forward a copy),
 *  - gives the device's process_mad hook the first chance to consume or
 *    answer it,
 *  - otherwise hands it to the agent returned by find_mad_agent().
 *
 * A second buffer ("response") is allocated up front.  At "out" it is the
 * buffer passed to ib_mad_post_receive_mads(); the original buffer is
 * freed unless ownership moved to ib_mad_complete_recv().  If no response
 * buffer exists the original buffer is passed to
 * ib_mad_post_receive_mads() instead.
 */
static void ib_mad_recv_done_handler(struct ib_mad_port_private *port_priv,
				     struct ib_wc *wc)
{
	struct ib_mad_qp_info *qp_info;
	struct ib_mad_private_header *mad_priv_hdr;
	struct ib_mad_private *recv, *response = NULL;
	struct ib_mad_list_head *mad_list;
	struct ib_mad_agent_private *mad_agent;
	int port_num;

	mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
	qp_info = mad_list->mad_queue->qp_info;
	dequeue_mad(mad_list);

	mad_priv_hdr = container_of(mad_list, struct ib_mad_private_header,
				    mad_list);
	recv = container_of(mad_priv_hdr, struct ib_mad_private, header);
	/* The mapped region is the buffer minus its private header */
	ib_dma_unmap_single(port_priv->device,
			    recv->header.mapping,
			    sizeof(struct ib_mad_private) -
			      sizeof(struct ib_mad_private_header),
			    DMA_FROM_DEVICE);

	/* Setup MAD receive work completion from "normal" work completion */
	recv->header.wc = *wc;
	recv->header.recv_wc.wc = &recv->header.wc;
	recv->header.recv_wc.mad_len = sizeof(struct ib_mad);
	recv->header.recv_wc.recv_buf.mad = &recv->mad.mad;
	recv->header.recv_wc.recv_buf.grh = &recv->grh;

	if (atomic_read(&qp_info->snoop_count))
		snoop_recv(qp_info, &recv->header.recv_wc, IB_MAD_SNOOP_RECVS);

	/* Validate MAD */
	if (!validate_mad(&recv->mad.mad, qp_info->qp->qp_num))
		goto out;

	response = kmem_cache_alloc(ib_mad_cache, GFP_KERNEL);
	if (!response) {
		printk(KERN_ERR PFX "ib_mad_recv_done_handler no memory "
		       "for response buffer\n");
		goto out;
	}

	/* On a switch the arrival port comes from the work completion */
	if (port_priv->device->node_type == RDMA_NODE_IB_SWITCH)
		port_num = wc->port_num;
	else
		port_num = port_priv->port_num;

	if (recv->mad.mad.mad_hdr.mgmt_class ==
	    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
		enum smi_forward_action retsmi;

		if (smi_handle_dr_smp_recv(&recv->mad.smp,
					   port_priv->device->node_type,
					   port_num,
					   port_priv->device->phys_port_cnt) ==
					   IB_SMI_DISCARD)
			goto out;

		retsmi = smi_check_forward_dr_smp(&recv->mad.smp);
		if (retsmi == IB_SMI_LOCAL)
			goto local;

		if (retsmi == IB_SMI_SEND) { /* don't forward */
			if (smi_handle_dr_smp_send(&recv->mad.smp,
						   port_priv->device->node_type,
						   port_num) == IB_SMI_DISCARD)
				goto out;

			if (smi_check_local_smp(&recv->mad.smp, port_priv->device) == IB_SMI_DISCARD)
				goto out;
		} else if (port_priv->device->node_type == RDMA_NODE_IB_SWITCH) {
			/* forward case for switches */
			memcpy(response, recv, sizeof(*response));
			/* Re-point the copied internal pointers at the copy */
			response->header.recv_wc.wc = &response->header.wc;
			response->header.recv_wc.recv_buf.mad = &response->mad.mad;
			response->header.recv_wc.recv_buf.grh = &response->grh;

			agent_send_response(&response->mad.mad,
					    &response->grh, wc,
					    port_priv->device,
					    smi_get_fwd_port(&recv->mad.smp),
					    qp_info->qp->qp_num);

			goto out;
		}
	}

local:
	/* Give driver "right of first refusal" on incoming MAD */
	if (port_priv->device->process_mad) {
		int ret;

		ret = port_priv->device->process_mad(port_priv->device, 0,
						     port_priv->port_num,
						     wc, &recv->grh,
						     &recv->mad.mad,
						     &response->mad.mad);
		if (ret & IB_MAD_RESULT_SUCCESS) {
			if (ret & IB_MAD_RESULT_CONSUMED)
				goto out;
			if (ret & IB_MAD_RESULT_REPLY) {
				/* Driver filled in response: send it back */
				agent_send_response(&response->mad.mad,
						    &recv->grh, wc,
						    port_priv->device,
						    port_num,
						    qp_info->qp->qp_num);
				goto out;
			}
		}
	}

	mad_agent = find_mad_agent(port_priv, &recv->mad.mad);
	if (mad_agent) {
		ib_mad_complete_recv(mad_agent, &recv->header.recv_wc);
		/*
		 * recv is freed up in error cases in ib_mad_complete_recv
		 * or via recv_handler in ib_mad_complete_recv()
		 */
		recv = NULL;
	}

out:
	/* Post another receive request for this QP */
	if (response) {
		ib_mad_post_receive_mads(qp_info, response);
		if (recv)
			kmem_cache_free(ib_mad_cache, recv);
	} else
		ib_mad_post_receive_mads(qp_info, recv);
}
1973
1974static void adjust_timeout(struct ib_mad_agent_private *mad_agent_priv)
1975{
1976	struct ib_mad_send_wr_private *mad_send_wr;
1977	unsigned long delay;
1978
1979	if (list_empty(&mad_agent_priv->wait_list)) {
1980		__cancel_delayed_work(&mad_agent_priv->timed_work);
1981	} else {
1982		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
1983					 struct ib_mad_send_wr_private,
1984					 agent_list);
1985
1986		if (time_after(mad_agent_priv->timeout,
1987			       mad_send_wr->timeout)) {
1988			mad_agent_priv->timeout = mad_send_wr->timeout;
1989			__cancel_delayed_work(&mad_agent_priv->timed_work);
1990			delay = mad_send_wr->timeout - jiffies;
1991			if ((long)delay <= 0)
1992				delay = 1;
1993			queue_delayed_work(mad_agent_priv->qp_info->
1994					   port_priv->wq,
1995					   &mad_agent_priv->timed_work, delay);
1996		}
1997	}
1998}
1999
2000static void wait_for_response(struct ib_mad_send_wr_private *mad_send_wr)
2001{
2002	struct ib_mad_agent_private *mad_agent_priv;
2003	struct ib_mad_send_wr_private *temp_mad_send_wr;
2004	struct list_head *list_item;
2005	unsigned long delay;
2006
2007	mad_agent_priv = mad_send_wr->mad_agent_priv;
2008	list_del(&mad_send_wr->agent_list);
2009
2010	delay = mad_send_wr->timeout;
2011	mad_send_wr->timeout += jiffies;
2012
2013	if (delay) {
2014		list_for_each_prev(list_item, &mad_agent_priv->wait_list) {
2015			temp_mad_send_wr = list_entry(list_item,
2016						struct ib_mad_send_wr_private,
2017						agent_list);
2018			if (time_after(mad_send_wr->timeout,
2019				       temp_mad_send_wr->timeout))
2020				break;
2021		}
2022	}
2023	else
2024		list_item = &mad_agent_priv->wait_list;
2025	list_add(&mad_send_wr->agent_list, list_item);
2026
2027	/* Reschedule a work item if we have a shorter timeout */
2028	if (mad_agent_priv->wait_list.next == &mad_send_wr->agent_list) {
2029		__cancel_delayed_work(&mad_agent_priv->timed_work);
2030		queue_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
2031				   &mad_agent_priv->timed_work, delay);
2032	}
2033}
2034
2035void ib_reset_mad_timeout(struct ib_mad_send_wr_private *mad_send_wr,
2036			  int timeout_ms)
2037{
2038	mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2039	wait_for_response(mad_send_wr);
2040}
2041
2042/*
2043 * Process a send work completion
2044 */
2045void ib_mad_complete_send_wr(struct ib_mad_send_wr_private *mad_send_wr,
2046			     struct ib_mad_send_wc *mad_send_wc)
2047{
2048	struct ib_mad_agent_private	*mad_agent_priv;
2049	unsigned long			flags;
2050	int				ret;
2051
2052	mad_agent_priv = mad_send_wr->mad_agent_priv;
2053	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2054	if (mad_agent_priv->agent.rmpp_version) {
2055		ret = ib_process_rmpp_send_wc(mad_send_wr, mad_send_wc);
2056		if (ret == IB_RMPP_RESULT_CONSUMED)
2057			goto done;
2058	} else
2059		ret = IB_RMPP_RESULT_UNHANDLED;
2060
2061	if (mad_send_wc->status != IB_WC_SUCCESS &&
2062	    mad_send_wr->status == IB_WC_SUCCESS) {
2063		mad_send_wr->status = mad_send_wc->status;
2064		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2065	}
2066
2067	if (--mad_send_wr->refcount > 0) {
2068		if (mad_send_wr->refcount == 1 && mad_send_wr->timeout &&
2069		    mad_send_wr->status == IB_WC_SUCCESS) {
2070			wait_for_response(mad_send_wr);
2071		}
2072		goto done;
2073	}
2074
2075	/* Remove send from MAD agent and notify client of completion */
2076	list_del(&mad_send_wr->agent_list);
2077	adjust_timeout(mad_agent_priv);
2078	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2079
2080	if (mad_send_wr->status != IB_WC_SUCCESS )
2081		mad_send_wc->status = mad_send_wr->status;
2082	if (ret == IB_RMPP_RESULT_INTERNAL)
2083		ib_rmpp_send_handler(mad_send_wc);
2084	else
2085		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2086						   mad_send_wc);
2087
2088	/* Release reference on agent taken when sending */
2089	deref_mad_agent(mad_agent_priv);
2090	return;
2091done:
2092	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2093}
2094
2095static void ib_mad_send_done_handler(struct ib_mad_port_private *port_priv,
2096				     struct ib_wc *wc)
2097{
 
 
 
2098	struct ib_mad_send_wr_private	*mad_send_wr, *queued_send_wr;
2099	struct ib_mad_list_head		*mad_list;
2100	struct ib_mad_qp_info		*qp_info;
2101	struct ib_mad_queue		*send_queue;
2102	struct ib_send_wr		*bad_send_wr;
2103	struct ib_mad_send_wc		mad_send_wc;
2104	unsigned long flags;
2105	int ret;
2106
2107	mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
 
 
 
 
 
 
 
2108	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2109				   mad_list);
2110	send_queue = mad_list->mad_queue;
2111	qp_info = send_queue->qp_info;
2112
2113retry:
2114	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2115			    mad_send_wr->header_mapping,
2116			    mad_send_wr->sg_list[0].length, DMA_TO_DEVICE);
2117	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2118			    mad_send_wr->payload_mapping,
2119			    mad_send_wr->sg_list[1].length, DMA_TO_DEVICE);
2120	queued_send_wr = NULL;
2121	spin_lock_irqsave(&send_queue->lock, flags);
2122	list_del(&mad_list->list);
2123
2124	/* Move queued send to the send queue */
2125	if (send_queue->count-- > send_queue->max_active) {
2126		mad_list = container_of(qp_info->overflow_list.next,
2127					struct ib_mad_list_head, list);
2128		queued_send_wr = container_of(mad_list,
2129					struct ib_mad_send_wr_private,
2130					mad_list);
2131		list_move_tail(&mad_list->list, &send_queue->list);
2132	}
2133	spin_unlock_irqrestore(&send_queue->lock, flags);
2134
2135	mad_send_wc.send_buf = &mad_send_wr->send_buf;
2136	mad_send_wc.status = wc->status;
2137	mad_send_wc.vendor_err = wc->vendor_err;
2138	if (atomic_read(&qp_info->snoop_count))
2139		snoop_send(qp_info, &mad_send_wr->send_buf, &mad_send_wc,
2140			   IB_MAD_SNOOP_SEND_COMPLETIONS);
2141	ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
2142
2143	if (queued_send_wr) {
2144		ret = ib_post_send(qp_info->qp, &queued_send_wr->send_wr,
2145				   &bad_send_wr);
2146		if (ret) {
2147			printk(KERN_ERR PFX "ib_post_send failed: %d\n", ret);
 
2148			mad_send_wr = queued_send_wr;
2149			wc->status = IB_WC_LOC_QP_OP_ERR;
2150			goto retry;
2151		}
2152	}
2153}
2154
2155static void mark_sends_for_retry(struct ib_mad_qp_info *qp_info)
2156{
2157	struct ib_mad_send_wr_private *mad_send_wr;
2158	struct ib_mad_list_head *mad_list;
2159	unsigned long flags;
2160
2161	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
2162	list_for_each_entry(mad_list, &qp_info->send_queue.list, list) {
2163		mad_send_wr = container_of(mad_list,
2164					   struct ib_mad_send_wr_private,
2165					   mad_list);
2166		mad_send_wr->retry = 1;
2167	}
2168	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
2169}
2170
2171static void mad_error_handler(struct ib_mad_port_private *port_priv,
2172			      struct ib_wc *wc)
2173{
2174	struct ib_mad_list_head *mad_list;
2175	struct ib_mad_qp_info *qp_info;
 
2176	struct ib_mad_send_wr_private *mad_send_wr;
2177	int ret;
2178
2179	/* Determine if failure was a send or receive */
2180	mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
2181	qp_info = mad_list->mad_queue->qp_info;
2182	if (mad_list->mad_queue == &qp_info->recv_queue)
2183		/*
2184		 * Receive errors indicate that the QP has entered the error
2185		 * state - error handling/shutdown code will cleanup
2186		 */
2187		return;
2188
2189	/*
2190	 * Send errors will transition the QP to SQE - move
2191	 * QP to RTS and repost flushed work requests
2192	 */
2193	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2194				   mad_list);
2195	if (wc->status == IB_WC_WR_FLUSH_ERR) {
2196		if (mad_send_wr->retry) {
2197			/* Repost send */
2198			struct ib_send_wr *bad_send_wr;
2199
2200			mad_send_wr->retry = 0;
2201			ret = ib_post_send(qp_info->qp, &mad_send_wr->send_wr,
2202					&bad_send_wr);
2203			if (ret)
2204				ib_mad_send_done_handler(port_priv, wc);
2205		} else
2206			ib_mad_send_done_handler(port_priv, wc);
2207	} else {
2208		struct ib_qp_attr *attr;
2209
2210		/* Transition QP to RTS and fail offending send */
2211		attr = kmalloc(sizeof *attr, GFP_KERNEL);
2212		if (attr) {
2213			attr->qp_state = IB_QPS_RTS;
2214			attr->cur_qp_state = IB_QPS_SQE;
2215			ret = ib_modify_qp(qp_info->qp, attr,
2216					   IB_QP_STATE | IB_QP_CUR_STATE);
2217			kfree(attr);
2218			if (ret)
2219				printk(KERN_ERR PFX "mad_error_handler - "
2220				       "ib_modify_qp to RTS : %d\n", ret);
 
2221			else
2222				mark_sends_for_retry(qp_info);
2223		}
2224		ib_mad_send_done_handler(port_priv, wc);
2225	}
2226}
2227
2228/*
2229 * IB MAD completion callback
2230 */
2231static void ib_mad_completion_handler(struct work_struct *work)
2232{
2233	struct ib_mad_port_private *port_priv;
2234	struct ib_wc wc;
2235
2236	port_priv = container_of(work, struct ib_mad_port_private, work);
2237	ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2238
2239	while (ib_poll_cq(port_priv->cq, 1, &wc) == 1) {
2240		if (wc.status == IB_WC_SUCCESS) {
2241			switch (wc.opcode) {
2242			case IB_WC_SEND:
2243				ib_mad_send_done_handler(port_priv, &wc);
2244				break;
2245			case IB_WC_RECV:
2246				ib_mad_recv_done_handler(port_priv, &wc);
2247				break;
2248			default:
2249				BUG_ON(1);
2250				break;
2251			}
2252		} else
2253			mad_error_handler(port_priv, &wc);
2254	}
2255}
2256
2257static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv)
2258{
2259	unsigned long flags;
2260	struct ib_mad_send_wr_private *mad_send_wr, *temp_mad_send_wr;
2261	struct ib_mad_send_wc mad_send_wc;
2262	struct list_head cancel_list;
2263
2264	INIT_LIST_HEAD(&cancel_list);
2265
2266	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2267	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2268				 &mad_agent_priv->send_list, agent_list) {
2269		if (mad_send_wr->status == IB_WC_SUCCESS) {
2270			mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2271			mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2272		}
2273	}
2274
2275	/* Empty wait list to prevent receives from finding a request */
2276	list_splice_init(&mad_agent_priv->wait_list, &cancel_list);
2277	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2278
2279	/* Report all cancelled requests */
2280	mad_send_wc.status = IB_WC_WR_FLUSH_ERR;
2281	mad_send_wc.vendor_err = 0;
2282
2283	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2284				 &cancel_list, agent_list) {
2285		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2286		list_del(&mad_send_wr->agent_list);
2287		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2288						   &mad_send_wc);
2289		atomic_dec(&mad_agent_priv->refcount);
2290	}
2291}
2292
2293static struct ib_mad_send_wr_private*
2294find_send_wr(struct ib_mad_agent_private *mad_agent_priv,
2295	     struct ib_mad_send_buf *send_buf)
2296{
2297	struct ib_mad_send_wr_private *mad_send_wr;
2298
2299	list_for_each_entry(mad_send_wr, &mad_agent_priv->wait_list,
2300			    agent_list) {
2301		if (&mad_send_wr->send_buf == send_buf)
2302			return mad_send_wr;
2303	}
2304
2305	list_for_each_entry(mad_send_wr, &mad_agent_priv->send_list,
2306			    agent_list) {
2307		if (is_data_mad(mad_agent_priv, mad_send_wr->send_buf.mad) &&
 
2308		    &mad_send_wr->send_buf == send_buf)
2309			return mad_send_wr;
2310	}
2311	return NULL;
2312}
2313
2314int ib_modify_mad(struct ib_mad_agent *mad_agent,
2315		  struct ib_mad_send_buf *send_buf, u32 timeout_ms)
2316{
2317	struct ib_mad_agent_private *mad_agent_priv;
2318	struct ib_mad_send_wr_private *mad_send_wr;
2319	unsigned long flags;
2320	int active;
2321
2322	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
2323				      agent);
2324	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2325	mad_send_wr = find_send_wr(mad_agent_priv, send_buf);
2326	if (!mad_send_wr || mad_send_wr->status != IB_WC_SUCCESS) {
2327		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2328		return -EINVAL;
2329	}
2330
2331	active = (!mad_send_wr->timeout || mad_send_wr->refcount > 1);
2332	if (!timeout_ms) {
2333		mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2334		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2335	}
2336
2337	mad_send_wr->send_buf.timeout_ms = timeout_ms;
2338	if (active)
2339		mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2340	else
2341		ib_reset_mad_timeout(mad_send_wr, timeout_ms);
2342
2343	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2344	return 0;
2345}
2346EXPORT_SYMBOL(ib_modify_mad);
2347
2348void ib_cancel_mad(struct ib_mad_agent *mad_agent,
2349		   struct ib_mad_send_buf *send_buf)
2350{
2351	ib_modify_mad(mad_agent, send_buf, 0);
2352}
2353EXPORT_SYMBOL(ib_cancel_mad);
2354
2355static void local_completions(struct work_struct *work)
2356{
2357	struct ib_mad_agent_private *mad_agent_priv;
2358	struct ib_mad_local_private *local;
2359	struct ib_mad_agent_private *recv_mad_agent;
2360	unsigned long flags;
2361	int free_mad;
2362	struct ib_wc wc;
2363	struct ib_mad_send_wc mad_send_wc;
 
2364
2365	mad_agent_priv =
2366		container_of(work, struct ib_mad_agent_private, local_work);
2367
 
 
 
2368	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2369	while (!list_empty(&mad_agent_priv->local_list)) {
2370		local = list_entry(mad_agent_priv->local_list.next,
2371				   struct ib_mad_local_private,
2372				   completion_list);
2373		list_del(&local->completion_list);
2374		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2375		free_mad = 0;
2376		if (local->mad_priv) {
 
2377			recv_mad_agent = local->recv_mad_agent;
2378			if (!recv_mad_agent) {
2379				printk(KERN_ERR PFX "No receive MAD agent for local completion\n");
 
2380				free_mad = 1;
2381				goto local_send_completion;
2382			}
2383
2384			/*
2385			 * Defined behavior is to complete response
2386			 * before request
2387			 */
2388			build_smp_wc(recv_mad_agent->agent.qp,
2389				     (unsigned long) local->mad_send_wr,
2390				     be16_to_cpu(IB_LID_PERMISSIVE),
2391				     0, recv_mad_agent->agent.port_num, &wc);
 
2392
2393			local->mad_priv->header.recv_wc.wc = &wc;
2394			local->mad_priv->header.recv_wc.mad_len =
2395						sizeof(struct ib_mad);
 
 
 
 
 
 
 
 
2396			INIT_LIST_HEAD(&local->mad_priv->header.recv_wc.rmpp_list);
2397			list_add(&local->mad_priv->header.recv_wc.recv_buf.list,
2398				 &local->mad_priv->header.recv_wc.rmpp_list);
2399			local->mad_priv->header.recv_wc.recv_buf.grh = NULL;
2400			local->mad_priv->header.recv_wc.recv_buf.mad =
2401						&local->mad_priv->mad.mad;
2402			if (atomic_read(&recv_mad_agent->qp_info->snoop_count))
2403				snoop_recv(recv_mad_agent->qp_info,
2404					  &local->mad_priv->header.recv_wc,
2405					   IB_MAD_SNOOP_RECVS);
2406			recv_mad_agent->agent.recv_handler(
2407						&recv_mad_agent->agent,
 
2408						&local->mad_priv->header.recv_wc);
2409			spin_lock_irqsave(&recv_mad_agent->lock, flags);
2410			atomic_dec(&recv_mad_agent->refcount);
2411			spin_unlock_irqrestore(&recv_mad_agent->lock, flags);
2412		}
2413
2414local_send_completion:
2415		/* Complete send */
2416		mad_send_wc.status = IB_WC_SUCCESS;
2417		mad_send_wc.vendor_err = 0;
2418		mad_send_wc.send_buf = &local->mad_send_wr->send_buf;
2419		if (atomic_read(&mad_agent_priv->qp_info->snoop_count))
2420			snoop_send(mad_agent_priv->qp_info,
2421				   &local->mad_send_wr->send_buf,
2422				   &mad_send_wc, IB_MAD_SNOOP_SEND_COMPLETIONS);
2423		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2424						   &mad_send_wc);
2425
2426		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2427		atomic_dec(&mad_agent_priv->refcount);
2428		if (free_mad)
2429			kmem_cache_free(ib_mad_cache, local->mad_priv);
2430		kfree(local);
2431	}
2432	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2433}
2434
2435static int retry_send(struct ib_mad_send_wr_private *mad_send_wr)
2436{
2437	int ret;
2438
2439	if (!mad_send_wr->retries_left)
2440		return -ETIMEDOUT;
2441
2442	mad_send_wr->retries_left--;
2443	mad_send_wr->send_buf.retries++;
2444
2445	mad_send_wr->timeout = msecs_to_jiffies(mad_send_wr->send_buf.timeout_ms);
2446
2447	if (mad_send_wr->mad_agent_priv->agent.rmpp_version) {
2448		ret = ib_retry_rmpp(mad_send_wr);
2449		switch (ret) {
2450		case IB_RMPP_RESULT_UNHANDLED:
2451			ret = ib_send_mad(mad_send_wr);
2452			break;
2453		case IB_RMPP_RESULT_CONSUMED:
2454			ret = 0;
2455			break;
2456		default:
2457			ret = -ECOMM;
2458			break;
2459		}
2460	} else
2461		ret = ib_send_mad(mad_send_wr);
2462
2463	if (!ret) {
2464		mad_send_wr->refcount++;
2465		list_add_tail(&mad_send_wr->agent_list,
2466			      &mad_send_wr->mad_agent_priv->send_list);
2467	}
2468	return ret;
2469}
2470
2471static void timeout_sends(struct work_struct *work)
2472{
2473	struct ib_mad_agent_private *mad_agent_priv;
2474	struct ib_mad_send_wr_private *mad_send_wr;
2475	struct ib_mad_send_wc mad_send_wc;
2476	unsigned long flags, delay;
2477
2478	mad_agent_priv = container_of(work, struct ib_mad_agent_private,
2479				      timed_work.work);
2480	mad_send_wc.vendor_err = 0;
2481
2482	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2483	while (!list_empty(&mad_agent_priv->wait_list)) {
2484		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2485					 struct ib_mad_send_wr_private,
2486					 agent_list);
2487
2488		if (time_after(mad_send_wr->timeout, jiffies)) {
2489			delay = mad_send_wr->timeout - jiffies;
2490			if ((long)delay <= 0)
2491				delay = 1;
2492			queue_delayed_work(mad_agent_priv->qp_info->
2493					   port_priv->wq,
2494					   &mad_agent_priv->timed_work, delay);
2495			break;
2496		}
2497
2498		list_del(&mad_send_wr->agent_list);
2499		if (mad_send_wr->status == IB_WC_SUCCESS &&
2500		    !retry_send(mad_send_wr))
2501			continue;
2502
2503		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2504
2505		if (mad_send_wr->status == IB_WC_SUCCESS)
2506			mad_send_wc.status = IB_WC_RESP_TIMEOUT_ERR;
2507		else
2508			mad_send_wc.status = mad_send_wr->status;
2509		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2510		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2511						   &mad_send_wc);
2512
2513		atomic_dec(&mad_agent_priv->refcount);
2514		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2515	}
2516	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2517}
2518
2519static void ib_mad_thread_completion_handler(struct ib_cq *cq, void *arg)
2520{
2521	struct ib_mad_port_private *port_priv = cq->cq_context;
2522	unsigned long flags;
2523
2524	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2525	if (!list_empty(&port_priv->port_list))
2526		queue_work(port_priv->wq, &port_priv->work);
2527	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2528}
2529
2530/*
2531 * Allocate receive MADs and post receive WRs for them
2532 */
2533static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
2534				    struct ib_mad_private *mad)
2535{
2536	unsigned long flags;
2537	int post, ret;
2538	struct ib_mad_private *mad_priv;
2539	struct ib_sge sg_list;
2540	struct ib_recv_wr recv_wr, *bad_recv_wr;
2541	struct ib_mad_queue *recv_queue = &qp_info->recv_queue;
2542
2543	/* Initialize common scatter list fields */
2544	sg_list.length = sizeof *mad_priv - sizeof mad_priv->header;
2545	sg_list.lkey = (*qp_info->port_priv->mr).lkey;
2546
2547	/* Initialize common receive WR fields */
2548	recv_wr.next = NULL;
2549	recv_wr.sg_list = &sg_list;
2550	recv_wr.num_sge = 1;
2551
2552	do {
2553		/* Allocate and map receive buffer */
2554		if (mad) {
2555			mad_priv = mad;
2556			mad = NULL;
2557		} else {
2558			mad_priv = kmem_cache_alloc(ib_mad_cache, GFP_KERNEL);
 
2559			if (!mad_priv) {
2560				printk(KERN_ERR PFX "No memory for receive buffer\n");
2561				ret = -ENOMEM;
2562				break;
2563			}
2564		}
 
2565		sg_list.addr = ib_dma_map_single(qp_info->port_priv->device,
2566						 &mad_priv->grh,
2567						 sizeof *mad_priv -
2568						   sizeof mad_priv->header,
2569						 DMA_FROM_DEVICE);
 
 
 
 
 
2570		mad_priv->header.mapping = sg_list.addr;
2571		recv_wr.wr_id = (unsigned long)&mad_priv->header.mad_list;
2572		mad_priv->header.mad_list.mad_queue = recv_queue;
 
 
2573
2574		/* Post receive WR */
2575		spin_lock_irqsave(&recv_queue->lock, flags);
2576		post = (++recv_queue->count < recv_queue->max_active);
2577		list_add_tail(&mad_priv->header.mad_list.list, &recv_queue->list);
2578		spin_unlock_irqrestore(&recv_queue->lock, flags);
2579		ret = ib_post_recv(qp_info->qp, &recv_wr, &bad_recv_wr);
2580		if (ret) {
2581			spin_lock_irqsave(&recv_queue->lock, flags);
2582			list_del(&mad_priv->header.mad_list.list);
2583			recv_queue->count--;
2584			spin_unlock_irqrestore(&recv_queue->lock, flags);
2585			ib_dma_unmap_single(qp_info->port_priv->device,
2586					    mad_priv->header.mapping,
2587					    sizeof *mad_priv -
2588					      sizeof mad_priv->header,
2589					    DMA_FROM_DEVICE);
2590			kmem_cache_free(ib_mad_cache, mad_priv);
2591			printk(KERN_ERR PFX "ib_post_recv failed: %d\n", ret);
 
2592			break;
2593		}
2594	} while (post);
2595
2596	return ret;
2597}
2598
2599/*
2600 * Return all the posted receive MADs
2601 */
2602static void cleanup_recv_queue(struct ib_mad_qp_info *qp_info)
2603{
2604	struct ib_mad_private_header *mad_priv_hdr;
2605	struct ib_mad_private *recv;
2606	struct ib_mad_list_head *mad_list;
2607
2608	if (!qp_info->qp)
2609		return;
2610
2611	while (!list_empty(&qp_info->recv_queue.list)) {
2612
2613		mad_list = list_entry(qp_info->recv_queue.list.next,
2614				      struct ib_mad_list_head, list);
2615		mad_priv_hdr = container_of(mad_list,
2616					    struct ib_mad_private_header,
2617					    mad_list);
2618		recv = container_of(mad_priv_hdr, struct ib_mad_private,
2619				    header);
2620
2621		/* Remove from posted receive MAD list */
2622		list_del(&mad_list->list);
2623
2624		ib_dma_unmap_single(qp_info->port_priv->device,
2625				    recv->header.mapping,
2626				    sizeof(struct ib_mad_private) -
2627				      sizeof(struct ib_mad_private_header),
2628				    DMA_FROM_DEVICE);
2629		kmem_cache_free(ib_mad_cache, recv);
2630	}
2631
2632	qp_info->recv_queue.count = 0;
2633}
2634
2635/*
2636 * Start the port
2637 */
2638static int ib_mad_port_start(struct ib_mad_port_private *port_priv)
2639{
2640	int ret, i;
2641	struct ib_qp_attr *attr;
2642	struct ib_qp *qp;
 
2643
2644	attr = kmalloc(sizeof *attr, GFP_KERNEL);
2645	if (!attr) {
2646		printk(KERN_ERR PFX "Couldn't kmalloc ib_qp_attr\n");
2647		return -ENOMEM;
2648	}
 
 
 
 
2649
2650	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2651		qp = port_priv->qp_info[i].qp;
2652		if (!qp)
2653			continue;
2654
2655		/*
2656		 * PKey index for QP1 is irrelevant but
2657		 * one is needed for the Reset to Init transition
2658		 */
2659		attr->qp_state = IB_QPS_INIT;
2660		attr->pkey_index = 0;
2661		attr->qkey = (qp->qp_num == 0) ? 0 : IB_QP1_QKEY;
2662		ret = ib_modify_qp(qp, attr, IB_QP_STATE |
2663					     IB_QP_PKEY_INDEX | IB_QP_QKEY);
2664		if (ret) {
2665			printk(KERN_ERR PFX "Couldn't change QP%d state to "
2666			       "INIT: %d\n", i, ret);
 
2667			goto out;
2668		}
2669
2670		attr->qp_state = IB_QPS_RTR;
2671		ret = ib_modify_qp(qp, attr, IB_QP_STATE);
2672		if (ret) {
2673			printk(KERN_ERR PFX "Couldn't change QP%d state to "
2674			       "RTR: %d\n", i, ret);
 
2675			goto out;
2676		}
2677
2678		attr->qp_state = IB_QPS_RTS;
2679		attr->sq_psn = IB_MAD_SEND_Q_PSN;
2680		ret = ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_SQ_PSN);
2681		if (ret) {
2682			printk(KERN_ERR PFX "Couldn't change QP%d state to "
2683			       "RTS: %d\n", i, ret);
 
2684			goto out;
2685		}
2686	}
2687
2688	ret = ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2689	if (ret) {
2690		printk(KERN_ERR PFX "Failed to request completion "
2691		       "notification: %d\n", ret);
 
2692		goto out;
2693	}
2694
2695	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2696		if (!port_priv->qp_info[i].qp)
2697			continue;
2698
2699		ret = ib_mad_post_receive_mads(&port_priv->qp_info[i], NULL);
2700		if (ret) {
2701			printk(KERN_ERR PFX "Couldn't post receive WRs\n");
 
2702			goto out;
2703		}
2704	}
2705out:
2706	kfree(attr);
2707	return ret;
2708}
2709
2710static void qp_event_handler(struct ib_event *event, void *qp_context)
2711{
2712	struct ib_mad_qp_info	*qp_info = qp_context;
2713
2714	/* It's worse than that! He's dead, Jim! */
2715	printk(KERN_ERR PFX "Fatal error (%d) on MAD QP (%d)\n",
 
2716		event->event, qp_info->qp->qp_num);
2717}
2718
2719static void init_mad_queue(struct ib_mad_qp_info *qp_info,
2720			   struct ib_mad_queue *mad_queue)
2721{
2722	mad_queue->qp_info = qp_info;
2723	mad_queue->count = 0;
2724	spin_lock_init(&mad_queue->lock);
2725	INIT_LIST_HEAD(&mad_queue->list);
2726}
2727
2728static void init_mad_qp(struct ib_mad_port_private *port_priv,
2729			struct ib_mad_qp_info *qp_info)
2730{
2731	qp_info->port_priv = port_priv;
2732	init_mad_queue(qp_info, &qp_info->send_queue);
2733	init_mad_queue(qp_info, &qp_info->recv_queue);
2734	INIT_LIST_HEAD(&qp_info->overflow_list);
2735	spin_lock_init(&qp_info->snoop_lock);
2736	qp_info->snoop_table = NULL;
2737	qp_info->snoop_table_size = 0;
2738	atomic_set(&qp_info->snoop_count, 0);
2739}
2740
2741static int create_mad_qp(struct ib_mad_qp_info *qp_info,
2742			 enum ib_qp_type qp_type)
2743{
2744	struct ib_qp_init_attr	qp_init_attr;
2745	int ret;
2746
2747	memset(&qp_init_attr, 0, sizeof qp_init_attr);
2748	qp_init_attr.send_cq = qp_info->port_priv->cq;
2749	qp_init_attr.recv_cq = qp_info->port_priv->cq;
2750	qp_init_attr.sq_sig_type = IB_SIGNAL_ALL_WR;
2751	qp_init_attr.cap.max_send_wr = mad_sendq_size;
2752	qp_init_attr.cap.max_recv_wr = mad_recvq_size;
2753	qp_init_attr.cap.max_send_sge = IB_MAD_SEND_REQ_MAX_SG;
2754	qp_init_attr.cap.max_recv_sge = IB_MAD_RECV_REQ_MAX_SG;
2755	qp_init_attr.qp_type = qp_type;
2756	qp_init_attr.port_num = qp_info->port_priv->port_num;
2757	qp_init_attr.qp_context = qp_info;
2758	qp_init_attr.event_handler = qp_event_handler;
2759	qp_info->qp = ib_create_qp(qp_info->port_priv->pd, &qp_init_attr);
2760	if (IS_ERR(qp_info->qp)) {
2761		printk(KERN_ERR PFX "Couldn't create ib_mad QP%d\n",
2762		       get_spl_qp_index(qp_type));
 
2763		ret = PTR_ERR(qp_info->qp);
2764		goto error;
2765	}
2766	/* Use minimum queue sizes unless the CQ is resized */
2767	qp_info->send_queue.max_active = mad_sendq_size;
2768	qp_info->recv_queue.max_active = mad_recvq_size;
2769	return 0;
2770
2771error:
2772	return ret;
2773}
2774
2775static void destroy_mad_qp(struct ib_mad_qp_info *qp_info)
2776{
2777	if (!qp_info->qp)
2778		return;
2779
2780	ib_destroy_qp(qp_info->qp);
2781	kfree(qp_info->snoop_table);
2782}
2783
2784/*
2785 * Open the port
2786 * Create the QP, PD, MR, and CQ if needed
2787 */
2788static int ib_mad_port_open(struct ib_device *device,
2789			    int port_num)
2790{
2791	int ret, cq_size;
2792	struct ib_mad_port_private *port_priv;
2793	unsigned long flags;
2794	char name[sizeof "ib_mad123"];
2795	int has_smi;
2796
 
 
 
 
 
 
 
2797	/* Create new device info */
2798	port_priv = kzalloc(sizeof *port_priv, GFP_KERNEL);
2799	if (!port_priv) {
2800		printk(KERN_ERR PFX "No memory for ib_mad_port_private\n");
2801		return -ENOMEM;
2802	}
2803
2804	port_priv->device = device;
2805	port_priv->port_num = port_num;
2806	spin_lock_init(&port_priv->reg_lock);
2807	INIT_LIST_HEAD(&port_priv->agent_list);
2808	init_mad_qp(port_priv, &port_priv->qp_info[0]);
2809	init_mad_qp(port_priv, &port_priv->qp_info[1]);
2810
2811	cq_size = mad_sendq_size + mad_recvq_size;
2812	has_smi = rdma_port_get_link_layer(device, port_num) == IB_LINK_LAYER_INFINIBAND;
2813	if (has_smi)
2814		cq_size *= 2;
2815
2816	port_priv->cq = ib_create_cq(port_priv->device,
2817				     ib_mad_thread_completion_handler,
2818				     NULL, port_priv, cq_size, 0);
2819	if (IS_ERR(port_priv->cq)) {
2820		printk(KERN_ERR PFX "Couldn't create ib_mad CQ\n");
2821		ret = PTR_ERR(port_priv->cq);
2822		goto error3;
2823	}
2824
2825	port_priv->pd = ib_alloc_pd(device);
2826	if (IS_ERR(port_priv->pd)) {
2827		printk(KERN_ERR PFX "Couldn't create ib_mad PD\n");
2828		ret = PTR_ERR(port_priv->pd);
2829		goto error4;
2830	}
2831
2832	port_priv->mr = ib_get_dma_mr(port_priv->pd, IB_ACCESS_LOCAL_WRITE);
2833	if (IS_ERR(port_priv->mr)) {
2834		printk(KERN_ERR PFX "Couldn't get ib_mad DMA MR\n");
2835		ret = PTR_ERR(port_priv->mr);
2836		goto error5;
2837	}
2838
2839	if (has_smi) {
2840		ret = create_mad_qp(&port_priv->qp_info[0], IB_QPT_SMI);
2841		if (ret)
2842			goto error6;
2843	}
2844	ret = create_mad_qp(&port_priv->qp_info[1], IB_QPT_GSI);
2845	if (ret)
2846		goto error7;
2847
2848	snprintf(name, sizeof name, "ib_mad%d", port_num);
2849	port_priv->wq = create_singlethread_workqueue(name);
2850	if (!port_priv->wq) {
2851		ret = -ENOMEM;
2852		goto error8;
2853	}
2854	INIT_WORK(&port_priv->work, ib_mad_completion_handler);
2855
2856	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2857	list_add_tail(&port_priv->port_list, &ib_mad_port_list);
2858	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2859
2860	ret = ib_mad_port_start(port_priv);
2861	if (ret) {
2862		printk(KERN_ERR PFX "Couldn't start port\n");
2863		goto error9;
2864	}
2865
2866	return 0;
2867
2868error9:
2869	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2870	list_del_init(&port_priv->port_list);
2871	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2872
2873	destroy_workqueue(port_priv->wq);
2874error8:
2875	destroy_mad_qp(&port_priv->qp_info[1]);
2876error7:
2877	destroy_mad_qp(&port_priv->qp_info[0]);
2878error6:
2879	ib_dereg_mr(port_priv->mr);
2880error5:
2881	ib_dealloc_pd(port_priv->pd);
2882error4:
2883	ib_destroy_cq(port_priv->cq);
2884	cleanup_recv_queue(&port_priv->qp_info[1]);
2885	cleanup_recv_queue(&port_priv->qp_info[0]);
2886error3:
2887	kfree(port_priv);
2888
2889	return ret;
2890}
2891
2892/*
2893 * Close the port
2894 * If there are no classes using the port, free the port
2895 * resources (CQ, MR, PD, QP) and remove the port's info structure
2896 */
2897static int ib_mad_port_close(struct ib_device *device, int port_num)
2898{
2899	struct ib_mad_port_private *port_priv;
2900	unsigned long flags;
2901
2902	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2903	port_priv = __ib_get_mad_port(device, port_num);
2904	if (port_priv == NULL) {
2905		spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2906		printk(KERN_ERR PFX "Port %d not found\n", port_num);
2907		return -ENODEV;
2908	}
2909	list_del_init(&port_priv->port_list);
2910	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2911
2912	destroy_workqueue(port_priv->wq);
2913	destroy_mad_qp(&port_priv->qp_info[1]);
2914	destroy_mad_qp(&port_priv->qp_info[0]);
2915	ib_dereg_mr(port_priv->mr);
2916	ib_dealloc_pd(port_priv->pd);
2917	ib_destroy_cq(port_priv->cq);
2918	cleanup_recv_queue(&port_priv->qp_info[1]);
2919	cleanup_recv_queue(&port_priv->qp_info[0]);
2920	/* XXX: Handle deallocation of MAD registration tables */
2921
2922	kfree(port_priv);
2923
2924	return 0;
2925}
2926
2927static void ib_mad_init_device(struct ib_device *device)
2928{
2929	int start, end, i;
2930
2931	if (rdma_node_get_transport(device->node_type) != RDMA_TRANSPORT_IB)
2932		return;
2933
2934	if (device->node_type == RDMA_NODE_IB_SWITCH) {
2935		start = 0;
2936		end   = 0;
2937	} else {
2938		start = 1;
2939		end   = device->phys_port_cnt;
2940	}
2941
2942	for (i = start; i <= end; i++) {
2943		if (ib_mad_port_open(device, i)) {
2944			printk(KERN_ERR PFX "Couldn't open %s port %d\n",
2945			       device->name, i);
2946			goto error;
2947		}
2948		if (ib_agent_port_open(device, i)) {
2949			printk(KERN_ERR PFX "Couldn't open %s port %d "
2950			       "for agents\n",
2951			       device->name, i);
2952			goto error_agent;
2953		}
2954	}
2955	return;
2956
2957error_agent:
2958	if (ib_mad_port_close(device, i))
2959		printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2960		       device->name, i);
2961
2962error:
2963	i--;
 
 
2964
2965	while (i >= start) {
2966		if (ib_agent_port_close(device, i))
2967			printk(KERN_ERR PFX "Couldn't close %s port %d "
2968			       "for agents\n",
2969			       device->name, i);
2970		if (ib_mad_port_close(device, i))
2971			printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2972			       device->name, i);
2973		i--;
2974	}
2975}
2976
2977static void ib_mad_remove_device(struct ib_device *device)
2978{
2979	int i, num_ports, cur_port;
2980
2981	if (rdma_node_get_transport(device->node_type) != RDMA_TRANSPORT_IB)
2982		return;
 
2983
2984	if (device->node_type == RDMA_NODE_IB_SWITCH) {
2985		num_ports = 1;
2986		cur_port = 0;
2987	} else {
2988		num_ports = device->phys_port_cnt;
2989		cur_port = 1;
2990	}
2991	for (i = 0; i < num_ports; i++, cur_port++) {
2992		if (ib_agent_port_close(device, cur_port))
2993			printk(KERN_ERR PFX "Couldn't close %s port %d "
2994			       "for agents\n",
2995			       device->name, cur_port);
2996		if (ib_mad_port_close(device, cur_port))
2997			printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2998			       device->name, cur_port);
2999	}
3000}
3001
3002static struct ib_client mad_client = {
3003	.name   = "mad",
3004	.add = ib_mad_init_device,
3005	.remove = ib_mad_remove_device
3006};
3007
3008static int __init ib_mad_init_module(void)
3009{
3010	int ret;
3011
3012	mad_recvq_size = min(mad_recvq_size, IB_MAD_QP_MAX_SIZE);
3013	mad_recvq_size = max(mad_recvq_size, IB_MAD_QP_MIN_SIZE);
3014
3015	mad_sendq_size = min(mad_sendq_size, IB_MAD_QP_MAX_SIZE);
3016	mad_sendq_size = max(mad_sendq_size, IB_MAD_QP_MIN_SIZE);
3017
3018	ib_mad_cache = kmem_cache_create("ib_mad",
3019					 sizeof(struct ib_mad_private),
3020					 0,
3021					 SLAB_HWCACHE_ALIGN,
3022					 NULL);
3023	if (!ib_mad_cache) {
3024		printk(KERN_ERR PFX "Couldn't create ib_mad cache\n");
3025		ret = -ENOMEM;
3026		goto error1;
3027	}
3028
3029	INIT_LIST_HEAD(&ib_mad_port_list);
3030
3031	if (ib_register_client(&mad_client)) {
3032		printk(KERN_ERR PFX "Couldn't register ib_mad client\n");
3033		ret = -EINVAL;
3034		goto error2;
3035	}
3036
3037	return 0;
3038
3039error2:
3040	kmem_cache_destroy(ib_mad_cache);
3041error1:
3042	return ret;
3043}
3044
/*
 * Module exit: unregister mad_client, then destroy the ib_mad slab
 * cache that ib_mad_init_module() created.
 */
3045static void __exit ib_mad_cleanup_module(void)
3046{
3047	ib_unregister_client(&mad_client);
3048	kmem_cache_destroy(ib_mad_cache);
3049}
3050
3051module_init(ib_mad_init_module);
3052module_exit(ib_mad_cleanup_module);
v4.17
   1/*
   2 * Copyright (c) 2004-2007 Voltaire, Inc. All rights reserved.
   3 * Copyright (c) 2005 Intel Corporation.  All rights reserved.
   4 * Copyright (c) 2005 Mellanox Technologies Ltd.  All rights reserved.
   5 * Copyright (c) 2009 HNR Consulting. All rights reserved.
   6 * Copyright (c) 2014 Intel Corporation.  All rights reserved.
   7 *
   8 * This software is available to you under a choice of one of two
   9 * licenses.  You may choose to be licensed under the terms of the GNU
  10 * General Public License (GPL) Version 2, available from the file
  11 * COPYING in the main directory of this source tree, or the
  12 * OpenIB.org BSD license below:
  13 *
  14 *     Redistribution and use in source and binary forms, with or
  15 *     without modification, are permitted provided that the following
  16 *     conditions are met:
  17 *
  18 *      - Redistributions of source code must retain the above
  19 *        copyright notice, this list of conditions and the following
  20 *        disclaimer.
  21 *
  22 *      - Redistributions in binary form must reproduce the above
  23 *        copyright notice, this list of conditions and the following
  24 *        disclaimer in the documentation and/or other materials
  25 *        provided with the distribution.
  26 *
  27 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  28 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  29 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  30 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  31 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  32 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  33 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  34 * SOFTWARE.
  35 *
  36 */
  37
  38#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  39
  40#include <linux/dma-mapping.h>
  41#include <linux/slab.h>
  42#include <linux/module.h>
  43#include <linux/security.h>
  44#include <rdma/ib_cache.h>
  45
  46#include "mad_priv.h"
  47#include "core_priv.h"
  48#include "mad_rmpp.h"
  49#include "smi.h"
  50#include "opa_smi.h"
  51#include "agent.h"
  52
 
 
 
 
 
  /* Send/receive queue depths, in work requests; defaults from IB_MAD_QP_*_SIZE */
  53static int mad_sendq_size = IB_MAD_QP_SEND_SIZE;
  54static int mad_recvq_size = IB_MAD_QP_RECV_SIZE;
  55
  /* Both depths are exported as module parameters with mode 0444 */
  56module_param_named(send_queue_size, mad_sendq_size, int, 0444);
  57MODULE_PARM_DESC(send_queue_size, "Size of send queue in number of work requests");
  58module_param_named(recv_queue_size, mad_recvq_size, int, 0444);
  59MODULE_PARM_DESC(recv_queue_size, "Size of receive queue in number of work requests");
  60
 
 
  /* List of ib_mad_port_private entries, linked through their port_list member */
  61static struct list_head ib_mad_port_list;
  /* Counter incremented to produce each registered agent's hi_tid */
  62static atomic_t ib_mad_client_id = ATOMIC_INIT(0);
  63
  64/* Port list lock */
  65static DEFINE_SPINLOCK(ib_mad_port_list_lock);
  66
  67/* Forward declarations */
  68static int method_in_use(struct ib_mad_mgmt_method_table **method,
  69			 struct ib_mad_reg_req *mad_reg_req);
  70static void remove_mad_reg_req(struct ib_mad_agent_private *priv);
  71static struct ib_mad_agent_private *find_mad_agent(
  72					struct ib_mad_port_private *port_priv,
  73					const struct ib_mad_hdr *mad);
  74static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
  75				    struct ib_mad_private *mad);
  76static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv);
  77static void timeout_sends(struct work_struct *work);
  78static void local_completions(struct work_struct *work);
  79static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
  80			      struct ib_mad_agent_private *agent_priv,
  81			      u8 mgmt_class);
  82static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
  83			   struct ib_mad_agent_private *agent_priv);
  84static bool ib_mad_send_error(struct ib_mad_port_private *port_priv,
  85			      struct ib_wc *wc);
  86static void ib_mad_send_done(struct ib_cq *cq, struct ib_wc *wc);
  87
  88/*
  89 * Returns a ib_mad_port_private structure or NULL for a device/port
  90 * Assumes ib_mad_port_list_lock is being held
  91 */
  92static inline struct ib_mad_port_private *
  93__ib_get_mad_port(struct ib_device *device, int port_num)
  94{
  95	struct ib_mad_port_private *entry;
  96
  97	list_for_each_entry(entry, &ib_mad_port_list, port_list) {
  98		if (entry->device == device && entry->port_num == port_num)
  99			return entry;
 100	}
 101	return NULL;
 102}
 103
 104/*
 105 * Wrapper function to return a ib_mad_port_private structure or NULL
 106 * for a device/port
 107 */
 108static inline struct ib_mad_port_private *
 109ib_get_mad_port(struct ib_device *device, int port_num)
 110{
 111	struct ib_mad_port_private *entry;
 112	unsigned long flags;
 113
 114	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
 115	entry = __ib_get_mad_port(device, port_num);
 116	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
 117
 118	return entry;
 119}
 120
 121static inline u8 convert_mgmt_class(u8 mgmt_class)
 122{
 123	/* Alias IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE to 0 */
 124	return mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE ?
 125		0 : mgmt_class;
 126}
 127
 128static int get_spl_qp_index(enum ib_qp_type qp_type)
 129{
 130	switch (qp_type)
 131	{
 132	case IB_QPT_SMI:
 133		return 0;
 134	case IB_QPT_GSI:
 135		return 1;
 136	default:
 137		return -1;
 138	}
 139}
 140
 141static int vendor_class_index(u8 mgmt_class)
 142{
 143	return mgmt_class - IB_MGMT_CLASS_VENDOR_RANGE2_START;
 144}
 145
 146static int is_vendor_class(u8 mgmt_class)
 147{
 148	if ((mgmt_class < IB_MGMT_CLASS_VENDOR_RANGE2_START) ||
 149	    (mgmt_class > IB_MGMT_CLASS_VENDOR_RANGE2_END))
 150		return 0;
 151	return 1;
 152}
 153
 /* Return 1 if any of the three OUI bytes is non-zero, 0 if all are zero */
static int is_vendor_oui(char *oui)
{
	int i;

	for (i = 0; i < 3; i++) {
		if (oui[i])
			return 1;
	}

	return 0;
}
 160
 161static int is_vendor_method_in_use(
 162		struct ib_mad_mgmt_vendor_class *vendor_class,
 163		struct ib_mad_reg_req *mad_reg_req)
 164{
 165	struct ib_mad_mgmt_method_table *method;
 166	int i;
 167
 168	for (i = 0; i < MAX_MGMT_OUI; i++) {
 169		if (!memcmp(vendor_class->oui[i], mad_reg_req->oui, 3)) {
 170			method = vendor_class->method_table[i];
 171			if (method) {
 172				if (method_in_use(&method, mad_reg_req))
 173					return 1;
 174				else
 175					break;
 176			}
 177		}
 178	}
 179	return 0;
 180}
 181
 182int ib_response_mad(const struct ib_mad_hdr *hdr)
 183{
 184	return ((hdr->method & IB_MGMT_METHOD_RESP) ||
 185		(hdr->method == IB_MGMT_METHOD_TRAP_REPRESS) ||
 186		((hdr->mgmt_class == IB_MGMT_CLASS_BM) &&
 187		 (hdr->attr_mod & IB_BM_ATTR_MOD_RESP)));
 188}
 189EXPORT_SYMBOL(ib_response_mad);
 190
 191/*
 192 * ib_register_mad_agent - Register to send/receive MADs
 193 */
 194struct ib_mad_agent *ib_register_mad_agent(struct ib_device *device,
 195					   u8 port_num,
 196					   enum ib_qp_type qp_type,
 197					   struct ib_mad_reg_req *mad_reg_req,
 198					   u8 rmpp_version,
 199					   ib_mad_send_handler send_handler,
 200					   ib_mad_recv_handler recv_handler,
 201					   void *context,
 202					   u32 registration_flags)
 203{
 204	struct ib_mad_port_private *port_priv;
 205	struct ib_mad_agent *ret = ERR_PTR(-EINVAL);
 206	struct ib_mad_agent_private *mad_agent_priv;
 207	struct ib_mad_reg_req *reg_req = NULL;
 208	struct ib_mad_mgmt_class_table *class;
 209	struct ib_mad_mgmt_vendor_class_table *vendor;
 210	struct ib_mad_mgmt_vendor_class *vendor_class;
 211	struct ib_mad_mgmt_method_table *method;
 212	int ret2, qpn;
 213	unsigned long flags;
 214	u8 mgmt_class, vclass;
 215
 216	/* Validate parameters */
 217	qpn = get_spl_qp_index(qp_type);
 218	if (qpn == -1) {
 219		dev_notice(&device->dev,
 220			   "ib_register_mad_agent: invalid QP Type %d\n",
 221			   qp_type);
 222		goto error1;
 223	}
 224
 225	if (rmpp_version && rmpp_version != IB_MGMT_RMPP_VERSION) {
 226		dev_notice(&device->dev,
 227			   "ib_register_mad_agent: invalid RMPP Version %u\n",
 228			   rmpp_version);
 229		goto error1;
 230	}
 231
 232	/* Validate MAD registration request if supplied */
 233	if (mad_reg_req) {
 234		if (mad_reg_req->mgmt_class_version >= MAX_MGMT_VERSION) {
 235			dev_notice(&device->dev,
 236				   "ib_register_mad_agent: invalid Class Version %u\n",
 237				   mad_reg_req->mgmt_class_version);
 238			goto error1;
 239		}
 240		if (!recv_handler) {
 241			dev_notice(&device->dev,
 242				   "ib_register_mad_agent: no recv_handler\n");
 243			goto error1;
 244		}
 245		if (mad_reg_req->mgmt_class >= MAX_MGMT_CLASS) {
 246			/*
 247			 * IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE is the only
 248			 * one in this range currently allowed
 249			 */
 250			if (mad_reg_req->mgmt_class !=
 251			    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
 252				dev_notice(&device->dev,
 253					   "ib_register_mad_agent: Invalid Mgmt Class 0x%x\n",
 254					   mad_reg_req->mgmt_class);
 255				goto error1;
 256			}
 257		} else if (mad_reg_req->mgmt_class == 0) {
 258			/*
 259			 * Class 0 is reserved in IBA and is used for
 260			 * aliasing of IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE
 261			 */
 262			dev_notice(&device->dev,
 263				   "ib_register_mad_agent: Invalid Mgmt Class 0\n");
 264			goto error1;
 265		} else if (is_vendor_class(mad_reg_req->mgmt_class)) {
 266			/*
 267			 * If class is in "new" vendor range,
 268			 * ensure supplied OUI is not zero
 269			 */
 270			if (!is_vendor_oui(mad_reg_req->oui)) {
 271				dev_notice(&device->dev,
 272					   "ib_register_mad_agent: No OUI specified for class 0x%x\n",
 273					   mad_reg_req->mgmt_class);
 274				goto error1;
 275			}
 276		}
 277		/* Make sure class supplied is consistent with RMPP */
 278		if (!ib_is_mad_class_rmpp(mad_reg_req->mgmt_class)) {
 279			if (rmpp_version) {
 280				dev_notice(&device->dev,
 281					   "ib_register_mad_agent: RMPP version for non-RMPP class 0x%x\n",
 282					   mad_reg_req->mgmt_class);
 283				goto error1;
 284			}
 285		}
 286
 287		/* Make sure class supplied is consistent with QP type */
 288		if (qp_type == IB_QPT_SMI) {
 289			if ((mad_reg_req->mgmt_class !=
 290					IB_MGMT_CLASS_SUBN_LID_ROUTED) &&
 291			    (mad_reg_req->mgmt_class !=
 292					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
 293				dev_notice(&device->dev,
 294					   "ib_register_mad_agent: Invalid SM QP type: class 0x%x\n",
 295					   mad_reg_req->mgmt_class);
 296				goto error1;
 297			}
 298		} else {
 299			if ((mad_reg_req->mgmt_class ==
 300					IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
 301			    (mad_reg_req->mgmt_class ==
 302					IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
 303				dev_notice(&device->dev,
 304					   "ib_register_mad_agent: Invalid GS QP type: class 0x%x\n",
 305					   mad_reg_req->mgmt_class);
 306				goto error1;
 307			}
 308		}
 309	} else {
 310		/* No registration request supplied */
 311		if (!send_handler)
 312			goto error1;
 313		if (registration_flags & IB_MAD_USER_RMPP)
 314			goto error1;
 315	}
 316
 317	/* Validate device and port */
 318	port_priv = ib_get_mad_port(device, port_num);
 319	if (!port_priv) {
 320		dev_notice(&device->dev,
 321			   "ib_register_mad_agent: Invalid port %d\n",
 322			   port_num);
 323		ret = ERR_PTR(-ENODEV);
 324		goto error1;
 325	}
 326
 327	/* Verify the QP requested is supported.  For example, Ethernet devices
 328	 * will not have QP0 */
 329	if (!port_priv->qp_info[qpn].qp) {
 330		dev_notice(&device->dev,
 331			   "ib_register_mad_agent: QP %d not supported\n", qpn);
 332		ret = ERR_PTR(-EPROTONOSUPPORT);
 333		goto error1;
 334	}
 335
 336	/* Allocate structures */
 337	mad_agent_priv = kzalloc(sizeof *mad_agent_priv, GFP_KERNEL);
 338	if (!mad_agent_priv) {
 339		ret = ERR_PTR(-ENOMEM);
 340		goto error1;
 341	}
 342
 
 
 
 
 
 
 
 343	if (mad_reg_req) {
 344		reg_req = kmemdup(mad_reg_req, sizeof *reg_req, GFP_KERNEL);
 345		if (!reg_req) {
 346			ret = ERR_PTR(-ENOMEM);
 347			goto error3;
 348		}
 349	}
 350
 351	/* Now, fill in the various structures */
 352	mad_agent_priv->qp_info = &port_priv->qp_info[qpn];
 353	mad_agent_priv->reg_req = reg_req;
 354	mad_agent_priv->agent.rmpp_version = rmpp_version;
 355	mad_agent_priv->agent.device = device;
 356	mad_agent_priv->agent.recv_handler = recv_handler;
 357	mad_agent_priv->agent.send_handler = send_handler;
 358	mad_agent_priv->agent.context = context;
 359	mad_agent_priv->agent.qp = port_priv->qp_info[qpn].qp;
 360	mad_agent_priv->agent.port_num = port_num;
 361	mad_agent_priv->agent.flags = registration_flags;
 362	spin_lock_init(&mad_agent_priv->lock);
 363	INIT_LIST_HEAD(&mad_agent_priv->send_list);
 364	INIT_LIST_HEAD(&mad_agent_priv->wait_list);
 365	INIT_LIST_HEAD(&mad_agent_priv->done_list);
 366	INIT_LIST_HEAD(&mad_agent_priv->rmpp_list);
 367	INIT_DELAYED_WORK(&mad_agent_priv->timed_work, timeout_sends);
 368	INIT_LIST_HEAD(&mad_agent_priv->local_list);
 369	INIT_WORK(&mad_agent_priv->local_work, local_completions);
 370	atomic_set(&mad_agent_priv->refcount, 1);
 371	init_completion(&mad_agent_priv->comp);
 372
 373	ret2 = ib_mad_agent_security_setup(&mad_agent_priv->agent, qp_type);
 374	if (ret2) {
 375		ret = ERR_PTR(ret2);
 376		goto error4;
 377	}
 378
 379	spin_lock_irqsave(&port_priv->reg_lock, flags);
 380	mad_agent_priv->agent.hi_tid = atomic_inc_return(&ib_mad_client_id);
 381
 382	/*
 383	 * Make sure MAD registration (if supplied)
 384	 * is non overlapping with any existing ones
 385	 */
 386	if (mad_reg_req) {
 387		mgmt_class = convert_mgmt_class(mad_reg_req->mgmt_class);
 388		if (!is_vendor_class(mgmt_class)) {
 389			class = port_priv->version[mad_reg_req->
 390						   mgmt_class_version].class;
 391			if (class) {
 392				method = class->method_table[mgmt_class];
 393				if (method) {
 394					if (method_in_use(&method,
 395							   mad_reg_req))
 396						goto error5;
 397				}
 398			}
 399			ret2 = add_nonoui_reg_req(mad_reg_req, mad_agent_priv,
 400						  mgmt_class);
 401		} else {
 402			/* "New" vendor class range */
 403			vendor = port_priv->version[mad_reg_req->
 404						    mgmt_class_version].vendor;
 405			if (vendor) {
 406				vclass = vendor_class_index(mgmt_class);
 407				vendor_class = vendor->vendor_class[vclass];
 408				if (vendor_class) {
 409					if (is_vendor_method_in_use(
 410							vendor_class,
 411							mad_reg_req))
 412						goto error5;
 413				}
 414			}
 415			ret2 = add_oui_reg_req(mad_reg_req, mad_agent_priv);
 416		}
 417		if (ret2) {
 418			ret = ERR_PTR(ret2);
 419			goto error5;
 420		}
 421	}
 422
 423	/* Add mad agent into port's agent list */
 424	list_add_tail(&mad_agent_priv->agent_list, &port_priv->agent_list);
 425	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 426
 427	return &mad_agent_priv->agent;
 428error5:
 
 429	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 430	ib_mad_agent_security_cleanup(&mad_agent_priv->agent);
 431error4:
 432	kfree(reg_req);
 433error3:
 
 
 434	kfree(mad_agent_priv);
 435error1:
 436	return ret;
 437}
 438EXPORT_SYMBOL(ib_register_mad_agent);
 439
 440static inline int is_snooping_sends(int mad_snoop_flags)
 441{
 442	return (mad_snoop_flags &
 443		(/*IB_MAD_SNOOP_POSTED_SENDS |
 444		 IB_MAD_SNOOP_RMPP_SENDS |*/
 445		 IB_MAD_SNOOP_SEND_COMPLETIONS /*|
 446		 IB_MAD_SNOOP_RMPP_SEND_COMPLETIONS*/));
 447}
 448
 449static inline int is_snooping_recvs(int mad_snoop_flags)
 450{
 451	return (mad_snoop_flags &
 452		(IB_MAD_SNOOP_RECVS /*|
 453		 IB_MAD_SNOOP_RMPP_RECVS*/));
 454}
 455
 456static int register_snoop_agent(struct ib_mad_qp_info *qp_info,
 457				struct ib_mad_snoop_private *mad_snoop_priv)
 458{
 459	struct ib_mad_snoop_private **new_snoop_table;
 460	unsigned long flags;
 461	int i;
 462
 463	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 464	/* Check for empty slot in array. */
 465	for (i = 0; i < qp_info->snoop_table_size; i++)
 466		if (!qp_info->snoop_table[i])
 467			break;
 468
 469	if (i == qp_info->snoop_table_size) {
 470		/* Grow table. */
 471		new_snoop_table = krealloc(qp_info->snoop_table,
 472					   sizeof mad_snoop_priv *
 473					   (qp_info->snoop_table_size + 1),
 474					   GFP_ATOMIC);
 475		if (!new_snoop_table) {
 476			i = -ENOMEM;
 477			goto out;
 478		}
 479
 480		qp_info->snoop_table = new_snoop_table;
 481		qp_info->snoop_table_size++;
 482	}
 483	qp_info->snoop_table[i] = mad_snoop_priv;
 484	atomic_inc(&qp_info->snoop_count);
 485out:
 486	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 487	return i;
 488}
 489
 490struct ib_mad_agent *ib_register_mad_snoop(struct ib_device *device,
 491					   u8 port_num,
 492					   enum ib_qp_type qp_type,
 493					   int mad_snoop_flags,
 494					   ib_mad_snoop_handler snoop_handler,
 495					   ib_mad_recv_handler recv_handler,
 496					   void *context)
 497{
 498	struct ib_mad_port_private *port_priv;
 499	struct ib_mad_agent *ret;
 500	struct ib_mad_snoop_private *mad_snoop_priv;
 501	int qpn;
 502	int err;
 503
 504	/* Validate parameters */
 505	if ((is_snooping_sends(mad_snoop_flags) && !snoop_handler) ||
 506	    (is_snooping_recvs(mad_snoop_flags) && !recv_handler)) {
 507		ret = ERR_PTR(-EINVAL);
 508		goto error1;
 509	}
 510	qpn = get_spl_qp_index(qp_type);
 511	if (qpn == -1) {
 512		ret = ERR_PTR(-EINVAL);
 513		goto error1;
 514	}
 515	port_priv = ib_get_mad_port(device, port_num);
 516	if (!port_priv) {
 517		ret = ERR_PTR(-ENODEV);
 518		goto error1;
 519	}
 520	/* Allocate structures */
 521	mad_snoop_priv = kzalloc(sizeof *mad_snoop_priv, GFP_KERNEL);
 522	if (!mad_snoop_priv) {
 523		ret = ERR_PTR(-ENOMEM);
 524		goto error1;
 525	}
 526
 527	/* Now, fill in the various structures */
 528	mad_snoop_priv->qp_info = &port_priv->qp_info[qpn];
 529	mad_snoop_priv->agent.device = device;
 530	mad_snoop_priv->agent.recv_handler = recv_handler;
 531	mad_snoop_priv->agent.snoop_handler = snoop_handler;
 532	mad_snoop_priv->agent.context = context;
 533	mad_snoop_priv->agent.qp = port_priv->qp_info[qpn].qp;
 534	mad_snoop_priv->agent.port_num = port_num;
 535	mad_snoop_priv->mad_snoop_flags = mad_snoop_flags;
 536	init_completion(&mad_snoop_priv->comp);
 537
 538	err = ib_mad_agent_security_setup(&mad_snoop_priv->agent, qp_type);
 539	if (err) {
 540		ret = ERR_PTR(err);
 541		goto error2;
 542	}
 543
 544	mad_snoop_priv->snoop_index = register_snoop_agent(
 545						&port_priv->qp_info[qpn],
 546						mad_snoop_priv);
 547	if (mad_snoop_priv->snoop_index < 0) {
 548		ret = ERR_PTR(mad_snoop_priv->snoop_index);
 549		goto error3;
 550	}
 551
 552	atomic_set(&mad_snoop_priv->refcount, 1);
 553	return &mad_snoop_priv->agent;
 554error3:
 555	ib_mad_agent_security_cleanup(&mad_snoop_priv->agent);
 556error2:
 557	kfree(mad_snoop_priv);
 558error1:
 559	return ret;
 560}
 561EXPORT_SYMBOL(ib_register_mad_snoop);
 562
 563static inline void deref_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 564{
 565	if (atomic_dec_and_test(&mad_agent_priv->refcount))
 566		complete(&mad_agent_priv->comp);
 567}
 568
 569static inline void deref_snoop_agent(struct ib_mad_snoop_private *mad_snoop_priv)
 570{
 571	if (atomic_dec_and_test(&mad_snoop_priv->refcount))
 572		complete(&mad_snoop_priv->comp);
 573}
 574
 575static void unregister_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
 576{
 577	struct ib_mad_port_private *port_priv;
 578	unsigned long flags;
 579
 580	/* Note that we could still be handling received MADs */
 581
 582	/*
 583	 * Canceling all sends results in dropping received response
 584	 * MADs, preventing us from queuing additional work
 585	 */
 586	cancel_mads(mad_agent_priv);
 587	port_priv = mad_agent_priv->qp_info->port_priv;
 588	cancel_delayed_work(&mad_agent_priv->timed_work);
 589
 590	spin_lock_irqsave(&port_priv->reg_lock, flags);
 591	remove_mad_reg_req(mad_agent_priv);
 592	list_del(&mad_agent_priv->agent_list);
 593	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
 594
 595	flush_workqueue(port_priv->wq);
 596	ib_cancel_rmpp_recvs(mad_agent_priv);
 597
 598	deref_mad_agent(mad_agent_priv);
 599	wait_for_completion(&mad_agent_priv->comp);
 600
 601	ib_mad_agent_security_cleanup(&mad_agent_priv->agent);
 602
 603	kfree(mad_agent_priv->reg_req);
 
 604	kfree(mad_agent_priv);
 605}
 606
 607static void unregister_mad_snoop(struct ib_mad_snoop_private *mad_snoop_priv)
 608{
 609	struct ib_mad_qp_info *qp_info;
 610	unsigned long flags;
 611
 612	qp_info = mad_snoop_priv->qp_info;
 613	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 614	qp_info->snoop_table[mad_snoop_priv->snoop_index] = NULL;
 615	atomic_dec(&qp_info->snoop_count);
 616	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 617
 618	deref_snoop_agent(mad_snoop_priv);
 619	wait_for_completion(&mad_snoop_priv->comp);
 620
 621	ib_mad_agent_security_cleanup(&mad_snoop_priv->agent);
 622
 623	kfree(mad_snoop_priv);
 624}
 625
 626/*
 627 * ib_unregister_mad_agent - Unregisters a client from using MAD services
 628 */
 629void ib_unregister_mad_agent(struct ib_mad_agent *mad_agent)
 630{
 631	struct ib_mad_agent_private *mad_agent_priv;
 632	struct ib_mad_snoop_private *mad_snoop_priv;
 633
 634	/* If the TID is zero, the agent can only snoop. */
 635	if (mad_agent->hi_tid) {
 636		mad_agent_priv = container_of(mad_agent,
 637					      struct ib_mad_agent_private,
 638					      agent);
 639		unregister_mad_agent(mad_agent_priv);
 640	} else {
 641		mad_snoop_priv = container_of(mad_agent,
 642					      struct ib_mad_snoop_private,
 643					      agent);
 644		unregister_mad_snoop(mad_snoop_priv);
 645	}
 
 646}
 647EXPORT_SYMBOL(ib_unregister_mad_agent);
 648
 649static void dequeue_mad(struct ib_mad_list_head *mad_list)
 650{
 651	struct ib_mad_queue *mad_queue;
 652	unsigned long flags;
 653
 654	BUG_ON(!mad_list->mad_queue);
 655	mad_queue = mad_list->mad_queue;
 656	spin_lock_irqsave(&mad_queue->lock, flags);
 657	list_del(&mad_list->list);
 658	mad_queue->count--;
 659	spin_unlock_irqrestore(&mad_queue->lock, flags);
 660}
 661
 662static void snoop_send(struct ib_mad_qp_info *qp_info,
 663		       struct ib_mad_send_buf *send_buf,
 664		       struct ib_mad_send_wc *mad_send_wc,
 665		       int mad_snoop_flags)
 666{
 667	struct ib_mad_snoop_private *mad_snoop_priv;
 668	unsigned long flags;
 669	int i;
 670
 671	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 672	for (i = 0; i < qp_info->snoop_table_size; i++) {
 673		mad_snoop_priv = qp_info->snoop_table[i];
 674		if (!mad_snoop_priv ||
 675		    !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
 676			continue;
 677
 678		atomic_inc(&mad_snoop_priv->refcount);
 679		spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 680		mad_snoop_priv->agent.snoop_handler(&mad_snoop_priv->agent,
 681						    send_buf, mad_send_wc);
 682		deref_snoop_agent(mad_snoop_priv);
 683		spin_lock_irqsave(&qp_info->snoop_lock, flags);
 684	}
 685	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 686}
 687
 688static void snoop_recv(struct ib_mad_qp_info *qp_info,
 689		       struct ib_mad_recv_wc *mad_recv_wc,
 690		       int mad_snoop_flags)
 691{
 692	struct ib_mad_snoop_private *mad_snoop_priv;
 693	unsigned long flags;
 694	int i;
 695
 696	spin_lock_irqsave(&qp_info->snoop_lock, flags);
 697	for (i = 0; i < qp_info->snoop_table_size; i++) {
 698		mad_snoop_priv = qp_info->snoop_table[i];
 699		if (!mad_snoop_priv ||
 700		    !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
 701			continue;
 702
 703		atomic_inc(&mad_snoop_priv->refcount);
 704		spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 705		mad_snoop_priv->agent.recv_handler(&mad_snoop_priv->agent, NULL,
 706						   mad_recv_wc);
 707		deref_snoop_agent(mad_snoop_priv);
 708		spin_lock_irqsave(&qp_info->snoop_lock, flags);
 709	}
 710	spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
 711}
 712
 713static void build_smp_wc(struct ib_qp *qp, struct ib_cqe *cqe, u16 slid,
 714		u16 pkey_index, u8 port_num, struct ib_wc *wc)
 
 715{
 716	memset(wc, 0, sizeof *wc);
 717	wc->wr_cqe = cqe;
 718	wc->status = IB_WC_SUCCESS;
 719	wc->opcode = IB_WC_RECV;
 720	wc->pkey_index = pkey_index;
 721	wc->byte_len = sizeof(struct ib_mad) + sizeof(struct ib_grh);
 722	wc->src_qp = IB_QP0;
 723	wc->qp = qp;
 724	wc->slid = slid;
 725	wc->sl = 0;
 726	wc->dlid_path_bits = 0;
 727	wc->port_num = port_num;
 728}
 729
 730static size_t mad_priv_size(const struct ib_mad_private *mp)
 731{
 732	return sizeof(struct ib_mad_private) + mp->mad_size;
 733}
 734
 735static struct ib_mad_private *alloc_mad_private(size_t mad_size, gfp_t flags)
 736{
 737	size_t size = sizeof(struct ib_mad_private) + mad_size;
 738	struct ib_mad_private *ret = kzalloc(size, flags);
 739
 740	if (ret)
 741		ret->mad_size = mad_size;
 742
 743	return ret;
 744}
 745
 746static size_t port_mad_size(const struct ib_mad_port_private *port_priv)
 747{
 748	return rdma_max_mad_size(port_priv->device, port_priv->port_num);
 749}
 750
 751static size_t mad_priv_dma_size(const struct ib_mad_private *mp)
 752{
 753	return sizeof(struct ib_grh) + mp->mad_size;
 754}
 755
 756/*
 757 * Return 0 if SMP is to be sent
 758 * Return 1 if SMP was consumed locally (whether or not solicited)
 759 * Return < 0 if error
 760 */
 761static int handle_outgoing_dr_smp(struct ib_mad_agent_private *mad_agent_priv,
 762				  struct ib_mad_send_wr_private *mad_send_wr)
 763{
 764	int ret = 0;
 765	struct ib_smp *smp = mad_send_wr->send_buf.mad;
 766	struct opa_smp *opa_smp = (struct opa_smp *)smp;
 767	unsigned long flags;
 768	struct ib_mad_local_private *local;
 769	struct ib_mad_private *mad_priv;
 770	struct ib_mad_port_private *port_priv;
 771	struct ib_mad_agent_private *recv_mad_agent = NULL;
 772	struct ib_device *device = mad_agent_priv->agent.device;
 773	u8 port_num;
 774	struct ib_wc mad_wc;
 775	struct ib_ud_wr *send_wr = &mad_send_wr->send_wr;
 776	size_t mad_size = port_mad_size(mad_agent_priv->qp_info->port_priv);
 777	u16 out_mad_pkey_index = 0;
 778	u16 drslid;
 779	bool opa = rdma_cap_opa_mad(mad_agent_priv->qp_info->port_priv->device,
 780				    mad_agent_priv->qp_info->port_priv->port_num);
 781
 782	if (rdma_cap_ib_switch(device) &&
 783	    smp->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
 784		port_num = send_wr->port_num;
 785	else
 786		port_num = mad_agent_priv->agent.port_num;
 787
 788	/*
 789	 * Directed route handling starts if the initial LID routed part of
 790	 * a request or the ending LID routed part of a response is empty.
 791	 * If we are at the start of the LID routed part, don't update the
 792	 * hop_ptr or hop_cnt.  See section 14.2.2, Vol 1 IB spec.
 793	 */
 794	if (opa && smp->class_version == OPA_SM_CLASS_VERSION) {
 795		u32 opa_drslid;
 
 
 
 
 
 
 796
 797		if ((opa_get_smp_direction(opa_smp)
 798		     ? opa_smp->route.dr.dr_dlid : opa_smp->route.dr.dr_slid) ==
 799		     OPA_LID_PERMISSIVE &&
 800		     opa_smi_handle_dr_smp_send(opa_smp,
 801						rdma_cap_ib_switch(device),
 802						port_num) == IB_SMI_DISCARD) {
 803			ret = -EINVAL;
 804			dev_err(&device->dev, "OPA Invalid directed route\n");
 805			goto out;
 806		}
 807		opa_drslid = be32_to_cpu(opa_smp->route.dr.dr_slid);
 808		if (opa_drslid != be32_to_cpu(OPA_LID_PERMISSIVE) &&
 809		    opa_drslid & 0xffff0000) {
 810			ret = -EINVAL;
 811			dev_err(&device->dev, "OPA Invalid dr_slid 0x%x\n",
 812			       opa_drslid);
 813			goto out;
 814		}
 815		drslid = (u16)(opa_drslid & 0x0000ffff);
 816
 817		/* Check to post send on QP or process locally */
 818		if (opa_smi_check_local_smp(opa_smp, device) == IB_SMI_DISCARD &&
 819		    opa_smi_check_local_returning_smp(opa_smp, device) == IB_SMI_DISCARD)
 820			goto out;
 821	} else {
 822		if ((ib_get_smp_direction(smp) ? smp->dr_dlid : smp->dr_slid) ==
 823		     IB_LID_PERMISSIVE &&
 824		     smi_handle_dr_smp_send(smp, rdma_cap_ib_switch(device), port_num) ==
 825		     IB_SMI_DISCARD) {
 826			ret = -EINVAL;
 827			dev_err(&device->dev, "Invalid directed route\n");
 828			goto out;
 829		}
 830		drslid = be16_to_cpu(smp->dr_slid);
 831
 832		/* Check to post send on QP or process locally */
 833		if (smi_check_local_smp(smp, device) == IB_SMI_DISCARD &&
 834		    smi_check_local_returning_smp(smp, device) == IB_SMI_DISCARD)
 835			goto out;
 836	}
 837
 838	local = kmalloc(sizeof *local, GFP_ATOMIC);
 839	if (!local) {
 840		ret = -ENOMEM;
 
 841		goto out;
 842	}
 843	local->mad_priv = NULL;
 844	local->recv_mad_agent = NULL;
 845	mad_priv = alloc_mad_private(mad_size, GFP_ATOMIC);
 846	if (!mad_priv) {
 847		ret = -ENOMEM;
 
 848		kfree(local);
 849		goto out;
 850	}
 851
 852	build_smp_wc(mad_agent_priv->agent.qp,
 853		     send_wr->wr.wr_cqe, drslid,
 854		     send_wr->pkey_index,
 855		     send_wr->port_num, &mad_wc);
 856
 857	if (opa && smp->base_version == OPA_MGMT_BASE_VERSION) {
 858		mad_wc.byte_len = mad_send_wr->send_buf.hdr_len
 859					+ mad_send_wr->send_buf.data_len
 860					+ sizeof(struct ib_grh);
 861	}
 862
 863	/* No GRH for DR SMP */
 864	ret = device->process_mad(device, 0, port_num, &mad_wc, NULL,
 865				  (const struct ib_mad_hdr *)smp, mad_size,
 866				  (struct ib_mad_hdr *)mad_priv->mad,
 867				  &mad_size, &out_mad_pkey_index);
 868	switch (ret)
 869	{
 870	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_REPLY:
 871		if (ib_response_mad((const struct ib_mad_hdr *)mad_priv->mad) &&
 872		    mad_agent_priv->agent.recv_handler) {
 873			local->mad_priv = mad_priv;
 874			local->recv_mad_agent = mad_agent_priv;
 875			/*
 876			 * Reference MAD agent until receive
 877			 * side of local completion handled
 878			 */
 879			atomic_inc(&mad_agent_priv->refcount);
 880		} else
 881			kfree(mad_priv);
 882		break;
 883	case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_CONSUMED:
 884		kfree(mad_priv);
 885		break;
 886	case IB_MAD_RESULT_SUCCESS:
 887		/* Treat like an incoming receive MAD */
 888		port_priv = ib_get_mad_port(mad_agent_priv->agent.device,
 889					    mad_agent_priv->agent.port_num);
 890		if (port_priv) {
 891			memcpy(mad_priv->mad, smp, mad_priv->mad_size);
 892			recv_mad_agent = find_mad_agent(port_priv,
 893						        (const struct ib_mad_hdr *)mad_priv->mad);
 894		}
 895		if (!port_priv || !recv_mad_agent) {
 896			/*
 897			 * No receiving agent so drop packet and
 898			 * generate send completion.
 899			 */
 900			kfree(mad_priv);
 901			break;
 902		}
 903		local->mad_priv = mad_priv;
 904		local->recv_mad_agent = recv_mad_agent;
 905		break;
 906	default:
 907		kfree(mad_priv);
 908		kfree(local);
 909		ret = -EINVAL;
 910		goto out;
 911	}
 912
 913	local->mad_send_wr = mad_send_wr;
 914	if (opa) {
 915		local->mad_send_wr->send_wr.pkey_index = out_mad_pkey_index;
 916		local->return_wc_byte_len = mad_size;
 917	}
 918	/* Reference MAD agent until send side of local completion handled */
 919	atomic_inc(&mad_agent_priv->refcount);
 920	/* Queue local completion to local list */
 921	spin_lock_irqsave(&mad_agent_priv->lock, flags);
 922	list_add_tail(&local->completion_list, &mad_agent_priv->local_list);
 923	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
 924	queue_work(mad_agent_priv->qp_info->port_priv->wq,
 925		   &mad_agent_priv->local_work);
 926	ret = 1;
 927out:
 928	return ret;
 929}
 930
 931static int get_pad_size(int hdr_len, int data_len, size_t mad_size)
 932{
 933	int seg_size, pad;
 934
 935	seg_size = mad_size - hdr_len;
 936	if (data_len && seg_size) {
 937		pad = seg_size - data_len % seg_size;
 938		return pad == seg_size ? 0 : pad;
 939	} else
 940		return seg_size;
 941}
 942
 943static void free_send_rmpp_list(struct ib_mad_send_wr_private *mad_send_wr)
 944{
 945	struct ib_rmpp_segment *s, *t;
 946
 947	list_for_each_entry_safe(s, t, &mad_send_wr->rmpp_list, list) {
 948		list_del(&s->list);
 949		kfree(s);
 950	}
 951}
 952
 953static int alloc_send_rmpp_list(struct ib_mad_send_wr_private *send_wr,
 954				size_t mad_size, gfp_t gfp_mask)
 955{
 956	struct ib_mad_send_buf *send_buf = &send_wr->send_buf;
 957	struct ib_rmpp_mad *rmpp_mad = send_buf->mad;
 958	struct ib_rmpp_segment *seg = NULL;
 959	int left, seg_size, pad;
 960
 961	send_buf->seg_size = mad_size - send_buf->hdr_len;
 962	send_buf->seg_rmpp_size = mad_size - IB_MGMT_RMPP_HDR;
 963	seg_size = send_buf->seg_size;
 964	pad = send_wr->pad;
 965
 966	/* Allocate data segments. */
 967	for (left = send_buf->data_len + pad; left > 0; left -= seg_size) {
 968		seg = kmalloc(sizeof (*seg) + seg_size, gfp_mask);
 969		if (!seg) {
 
 
 
 970			free_send_rmpp_list(send_wr);
 971			return -ENOMEM;
 972		}
 973		seg->num = ++send_buf->seg_count;
 974		list_add_tail(&seg->list, &send_wr->rmpp_list);
 975	}
 976
 977	/* Zero any padding */
 978	if (pad)
 979		memset(seg->data + seg_size - pad, 0, pad);
 980
 981	rmpp_mad->rmpp_hdr.rmpp_version = send_wr->mad_agent_priv->
 982					  agent.rmpp_version;
 983	rmpp_mad->rmpp_hdr.rmpp_type = IB_MGMT_RMPP_TYPE_DATA;
 984	ib_set_rmpp_flags(&rmpp_mad->rmpp_hdr, IB_MGMT_RMPP_FLAG_ACTIVE);
 985
 986	send_wr->cur_seg = container_of(send_wr->rmpp_list.next,
 987					struct ib_rmpp_segment, list);
 988	send_wr->last_ack_seg = send_wr->cur_seg;
 989	return 0;
 990}
 991
 992int ib_mad_kernel_rmpp_agent(const struct ib_mad_agent *agent)
 993{
 994	return agent->rmpp_version && !(agent->flags & IB_MAD_USER_RMPP);
 995}
 996EXPORT_SYMBOL(ib_mad_kernel_rmpp_agent);
 997
 998struct ib_mad_send_buf * ib_create_send_mad(struct ib_mad_agent *mad_agent,
 999					    u32 remote_qpn, u16 pkey_index,
1000					    int rmpp_active,
1001					    int hdr_len, int data_len,
1002					    gfp_t gfp_mask,
1003					    u8 base_version)
1004{
1005	struct ib_mad_agent_private *mad_agent_priv;
1006	struct ib_mad_send_wr_private *mad_send_wr;
1007	int pad, message_size, ret, size;
1008	void *buf;
1009	size_t mad_size;
1010	bool opa;
1011
1012	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
1013				      agent);
1014
1015	opa = rdma_cap_opa_mad(mad_agent->device, mad_agent->port_num);
1016
1017	if (opa && base_version == OPA_MGMT_BASE_VERSION)
1018		mad_size = sizeof(struct opa_mad);
1019	else
1020		mad_size = sizeof(struct ib_mad);
1021
1022	pad = get_pad_size(hdr_len, data_len, mad_size);
1023	message_size = hdr_len + data_len + pad;
1024
1025	if (ib_mad_kernel_rmpp_agent(mad_agent)) {
1026		if (!rmpp_active && message_size > mad_size)
1027			return ERR_PTR(-EINVAL);
1028	} else
1029		if (rmpp_active || message_size > mad_size)
1030			return ERR_PTR(-EINVAL);
1031
1032	size = rmpp_active ? hdr_len : mad_size;
1033	buf = kzalloc(sizeof *mad_send_wr + size, gfp_mask);
1034	if (!buf)
1035		return ERR_PTR(-ENOMEM);
1036
1037	mad_send_wr = buf + size;
1038	INIT_LIST_HEAD(&mad_send_wr->rmpp_list);
1039	mad_send_wr->send_buf.mad = buf;
1040	mad_send_wr->send_buf.hdr_len = hdr_len;
1041	mad_send_wr->send_buf.data_len = data_len;
1042	mad_send_wr->pad = pad;
1043
1044	mad_send_wr->mad_agent_priv = mad_agent_priv;
1045	mad_send_wr->sg_list[0].length = hdr_len;
1046	mad_send_wr->sg_list[0].lkey = mad_agent->qp->pd->local_dma_lkey;
1047
1048	/* OPA MADs don't have to be the full 2048 bytes */
1049	if (opa && base_version == OPA_MGMT_BASE_VERSION &&
1050	    data_len < mad_size - hdr_len)
1051		mad_send_wr->sg_list[1].length = data_len;
1052	else
1053		mad_send_wr->sg_list[1].length = mad_size - hdr_len;
1054
1055	mad_send_wr->sg_list[1].lkey = mad_agent->qp->pd->local_dma_lkey;
1056
1057	mad_send_wr->mad_list.cqe.done = ib_mad_send_done;
1058
1059	mad_send_wr->send_wr.wr.wr_cqe = &mad_send_wr->mad_list.cqe;
1060	mad_send_wr->send_wr.wr.sg_list = mad_send_wr->sg_list;
1061	mad_send_wr->send_wr.wr.num_sge = 2;
1062	mad_send_wr->send_wr.wr.opcode = IB_WR_SEND;
1063	mad_send_wr->send_wr.wr.send_flags = IB_SEND_SIGNALED;
1064	mad_send_wr->send_wr.remote_qpn = remote_qpn;
1065	mad_send_wr->send_wr.remote_qkey = IB_QP_SET_QKEY;
1066	mad_send_wr->send_wr.pkey_index = pkey_index;
1067
1068	if (rmpp_active) {
1069		ret = alloc_send_rmpp_list(mad_send_wr, mad_size, gfp_mask);
1070		if (ret) {
1071			kfree(buf);
1072			return ERR_PTR(ret);
1073		}
1074	}
1075
1076	mad_send_wr->send_buf.mad_agent = mad_agent;
1077	atomic_inc(&mad_agent_priv->refcount);
1078	return &mad_send_wr->send_buf;
1079}
1080EXPORT_SYMBOL(ib_create_send_mad);
1081
1082int ib_get_mad_data_offset(u8 mgmt_class)
1083{
1084	if (mgmt_class == IB_MGMT_CLASS_SUBN_ADM)
1085		return IB_MGMT_SA_HDR;
1086	else if ((mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
1087		 (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
1088		 (mgmt_class == IB_MGMT_CLASS_BIS))
1089		return IB_MGMT_DEVICE_HDR;
1090	else if ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
1091		 (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END))
1092		return IB_MGMT_VENDOR_HDR;
1093	else
1094		return IB_MGMT_MAD_HDR;
1095}
1096EXPORT_SYMBOL(ib_get_mad_data_offset);
1097
1098int ib_is_mad_class_rmpp(u8 mgmt_class)
1099{
1100	if ((mgmt_class == IB_MGMT_CLASS_SUBN_ADM) ||
1101	    (mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
1102	    (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
1103	    (mgmt_class == IB_MGMT_CLASS_BIS) ||
1104	    ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
1105	     (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END)))
1106		return 1;
1107	return 0;
1108}
1109EXPORT_SYMBOL(ib_is_mad_class_rmpp);
1110
1111void *ib_get_rmpp_segment(struct ib_mad_send_buf *send_buf, int seg_num)
1112{
1113	struct ib_mad_send_wr_private *mad_send_wr;
1114	struct list_head *list;
1115
1116	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
1117				   send_buf);
1118	list = &mad_send_wr->cur_seg->list;
1119
1120	if (mad_send_wr->cur_seg->num < seg_num) {
1121		list_for_each_entry(mad_send_wr->cur_seg, list, list)
1122			if (mad_send_wr->cur_seg->num == seg_num)
1123				break;
1124	} else if (mad_send_wr->cur_seg->num > seg_num) {
1125		list_for_each_entry_reverse(mad_send_wr->cur_seg, list, list)
1126			if (mad_send_wr->cur_seg->num == seg_num)
1127				break;
1128	}
1129	return mad_send_wr->cur_seg->data;
1130}
1131EXPORT_SYMBOL(ib_get_rmpp_segment);
1132
1133static inline void *ib_get_payload(struct ib_mad_send_wr_private *mad_send_wr)
1134{
1135	if (mad_send_wr->send_buf.seg_count)
1136		return ib_get_rmpp_segment(&mad_send_wr->send_buf,
1137					   mad_send_wr->seg_num);
1138	else
1139		return mad_send_wr->send_buf.mad +
1140		       mad_send_wr->send_buf.hdr_len;
1141}
1142
1143void ib_free_send_mad(struct ib_mad_send_buf *send_buf)
1144{
1145	struct ib_mad_agent_private *mad_agent_priv;
1146	struct ib_mad_send_wr_private *mad_send_wr;
1147
1148	mad_agent_priv = container_of(send_buf->mad_agent,
1149				      struct ib_mad_agent_private, agent);
1150	mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
1151				   send_buf);
1152
1153	free_send_rmpp_list(mad_send_wr);
1154	kfree(send_buf->mad);
1155	deref_mad_agent(mad_agent_priv);
1156}
1157EXPORT_SYMBOL(ib_free_send_mad);
1158
1159int ib_send_mad(struct ib_mad_send_wr_private *mad_send_wr)
1160{
1161	struct ib_mad_qp_info *qp_info;
1162	struct list_head *list;
1163	struct ib_send_wr *bad_send_wr;
1164	struct ib_mad_agent *mad_agent;
1165	struct ib_sge *sge;
1166	unsigned long flags;
1167	int ret;
1168
1169	/* Set WR ID to find mad_send_wr upon completion */
1170	qp_info = mad_send_wr->mad_agent_priv->qp_info;
 
1171	mad_send_wr->mad_list.mad_queue = &qp_info->send_queue;
1172	mad_send_wr->mad_list.cqe.done = ib_mad_send_done;
1173	mad_send_wr->send_wr.wr.wr_cqe = &mad_send_wr->mad_list.cqe;
1174
1175	mad_agent = mad_send_wr->send_buf.mad_agent;
1176	sge = mad_send_wr->sg_list;
1177	sge[0].addr = ib_dma_map_single(mad_agent->device,
1178					mad_send_wr->send_buf.mad,
1179					sge[0].length,
1180					DMA_TO_DEVICE);
1181	if (unlikely(ib_dma_mapping_error(mad_agent->device, sge[0].addr)))
1182		return -ENOMEM;
1183
1184	mad_send_wr->header_mapping = sge[0].addr;
1185
1186	sge[1].addr = ib_dma_map_single(mad_agent->device,
1187					ib_get_payload(mad_send_wr),
1188					sge[1].length,
1189					DMA_TO_DEVICE);
1190	if (unlikely(ib_dma_mapping_error(mad_agent->device, sge[1].addr))) {
1191		ib_dma_unmap_single(mad_agent->device,
1192				    mad_send_wr->header_mapping,
1193				    sge[0].length, DMA_TO_DEVICE);
1194		return -ENOMEM;
1195	}
1196	mad_send_wr->payload_mapping = sge[1].addr;
1197
1198	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
1199	if (qp_info->send_queue.count < qp_info->send_queue.max_active) {
1200		ret = ib_post_send(mad_agent->qp, &mad_send_wr->send_wr.wr,
1201				   &bad_send_wr);
1202		list = &qp_info->send_queue.list;
1203	} else {
1204		ret = 0;
1205		list = &qp_info->overflow_list;
1206	}
1207
1208	if (!ret) {
1209		qp_info->send_queue.count++;
1210		list_add_tail(&mad_send_wr->mad_list.list, list);
1211	}
1212	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
1213	if (ret) {
1214		ib_dma_unmap_single(mad_agent->device,
1215				    mad_send_wr->header_mapping,
1216				    sge[0].length, DMA_TO_DEVICE);
1217		ib_dma_unmap_single(mad_agent->device,
1218				    mad_send_wr->payload_mapping,
1219				    sge[1].length, DMA_TO_DEVICE);
1220	}
1221	return ret;
1222}
1223
1224/*
1225 * ib_post_send_mad - Posts MAD(s) to the send queue of the QP associated
1226 *  with the registered client
1227 */
1228int ib_post_send_mad(struct ib_mad_send_buf *send_buf,
1229		     struct ib_mad_send_buf **bad_send_buf)
1230{
1231	struct ib_mad_agent_private *mad_agent_priv;
1232	struct ib_mad_send_buf *next_send_buf;
1233	struct ib_mad_send_wr_private *mad_send_wr;
1234	unsigned long flags;
1235	int ret = -EINVAL;
1236
1237	/* Walk list of send WRs and post each on send list */
1238	for (; send_buf; send_buf = next_send_buf) {
 
1239		mad_send_wr = container_of(send_buf,
1240					   struct ib_mad_send_wr_private,
1241					   send_buf);
1242		mad_agent_priv = mad_send_wr->mad_agent_priv;
1243
1244		ret = ib_mad_enforce_security(mad_agent_priv,
1245					      mad_send_wr->send_wr.pkey_index);
1246		if (ret)
1247			goto error;
1248
1249		if (!send_buf->mad_agent->send_handler ||
1250		    (send_buf->timeout_ms &&
1251		     !send_buf->mad_agent->recv_handler)) {
1252			ret = -EINVAL;
1253			goto error;
1254		}
1255
1256		if (!ib_is_mad_class_rmpp(((struct ib_mad_hdr *) send_buf->mad)->mgmt_class)) {
1257			if (mad_agent_priv->agent.rmpp_version) {
1258				ret = -EINVAL;
1259				goto error;
1260			}
1261		}
1262
1263		/*
1264		 * Save pointer to next work request to post in case the
1265		 * current one completes, and the user modifies the work
1266		 * request associated with the completion
1267		 */
1268		next_send_buf = send_buf->next;
1269		mad_send_wr->send_wr.ah = send_buf->ah;
1270
1271		if (((struct ib_mad_hdr *) send_buf->mad)->mgmt_class ==
1272		    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
1273			ret = handle_outgoing_dr_smp(mad_agent_priv,
1274						     mad_send_wr);
1275			if (ret < 0)		/* error */
1276				goto error;
1277			else if (ret == 1)	/* locally consumed */
1278				continue;
1279		}
1280
1281		mad_send_wr->tid = ((struct ib_mad_hdr *) send_buf->mad)->tid;
1282		/* Timeout will be updated after send completes */
1283		mad_send_wr->timeout = msecs_to_jiffies(send_buf->timeout_ms);
1284		mad_send_wr->max_retries = send_buf->retries;
1285		mad_send_wr->retries_left = send_buf->retries;
1286		send_buf->retries = 0;
1287		/* Reference for work request to QP + response */
1288		mad_send_wr->refcount = 1 + (mad_send_wr->timeout > 0);
1289		mad_send_wr->status = IB_WC_SUCCESS;
1290
1291		/* Reference MAD agent until send completes */
1292		atomic_inc(&mad_agent_priv->refcount);
1293		spin_lock_irqsave(&mad_agent_priv->lock, flags);
1294		list_add_tail(&mad_send_wr->agent_list,
1295			      &mad_agent_priv->send_list);
1296		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1297
1298		if (ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)) {
1299			ret = ib_send_rmpp_mad(mad_send_wr);
1300			if (ret >= 0 && ret != IB_RMPP_RESULT_CONSUMED)
1301				ret = ib_send_mad(mad_send_wr);
1302		} else
1303			ret = ib_send_mad(mad_send_wr);
1304		if (ret < 0) {
1305			/* Fail send request */
1306			spin_lock_irqsave(&mad_agent_priv->lock, flags);
1307			list_del(&mad_send_wr->agent_list);
1308			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1309			atomic_dec(&mad_agent_priv->refcount);
1310			goto error;
1311		}
1312	}
1313	return 0;
1314error:
1315	if (bad_send_buf)
1316		*bad_send_buf = send_buf;
1317	return ret;
1318}
1319EXPORT_SYMBOL(ib_post_send_mad);
1320
1321/*
1322 * ib_free_recv_mad - Returns data buffers used to receive
1323 *  a MAD to the access layer
1324 */
1325void ib_free_recv_mad(struct ib_mad_recv_wc *mad_recv_wc)
1326{
1327	struct ib_mad_recv_buf *mad_recv_buf, *temp_recv_buf;
1328	struct ib_mad_private_header *mad_priv_hdr;
1329	struct ib_mad_private *priv;
1330	struct list_head free_list;
1331
1332	INIT_LIST_HEAD(&free_list);
1333	list_splice_init(&mad_recv_wc->rmpp_list, &free_list);
1334
1335	list_for_each_entry_safe(mad_recv_buf, temp_recv_buf,
1336					&free_list, list) {
1337		mad_recv_wc = container_of(mad_recv_buf, struct ib_mad_recv_wc,
1338					   recv_buf);
1339		mad_priv_hdr = container_of(mad_recv_wc,
1340					    struct ib_mad_private_header,
1341					    recv_wc);
1342		priv = container_of(mad_priv_hdr, struct ib_mad_private,
1343				    header);
1344		kfree(priv);
1345	}
1346}
1347EXPORT_SYMBOL(ib_free_recv_mad);
1348
1349struct ib_mad_agent *ib_redirect_mad_qp(struct ib_qp *qp,
1350					u8 rmpp_version,
1351					ib_mad_send_handler send_handler,
1352					ib_mad_recv_handler recv_handler,
1353					void *context)
1354{
1355	return ERR_PTR(-EINVAL);	/* XXX: for now */
1356}
1357EXPORT_SYMBOL(ib_redirect_mad_qp);
1358
1359int ib_process_mad_wc(struct ib_mad_agent *mad_agent,
1360		      struct ib_wc *wc)
1361{
1362	dev_err(&mad_agent->device->dev,
1363		"ib_process_mad_wc() not implemented yet\n");
1364	return 0;
1365}
1366EXPORT_SYMBOL(ib_process_mad_wc);
1367
1368static int method_in_use(struct ib_mad_mgmt_method_table **method,
1369			 struct ib_mad_reg_req *mad_reg_req)
1370{
1371	int i;
1372
1373	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS) {
1374		if ((*method)->agent[i]) {
1375			pr_err("Method %d already in use\n", i);
1376			return -EINVAL;
1377		}
1378	}
1379	return 0;
1380}
1381
1382static int allocate_method_table(struct ib_mad_mgmt_method_table **method)
1383{
1384	/* Allocate management method table */
1385	*method = kzalloc(sizeof **method, GFP_ATOMIC);
1386	return (*method) ? 0 : (-ENOMEM);
 
 
 
 
 
 
1387}
1388
1389/*
1390 * Check to see if there are any methods still in use
1391 */
1392static int check_method_table(struct ib_mad_mgmt_method_table *method)
1393{
1394	int i;
1395
1396	for (i = 0; i < IB_MGMT_MAX_METHODS; i++)
1397		if (method->agent[i])
1398			return 1;
1399	return 0;
1400}
1401
1402/*
1403 * Check to see if there are any method tables for this class still in use
1404 */
1405static int check_class_table(struct ib_mad_mgmt_class_table *class)
1406{
1407	int i;
1408
1409	for (i = 0; i < MAX_MGMT_CLASS; i++)
1410		if (class->method_table[i])
1411			return 1;
1412	return 0;
1413}
1414
1415static int check_vendor_class(struct ib_mad_mgmt_vendor_class *vendor_class)
1416{
1417	int i;
1418
1419	for (i = 0; i < MAX_MGMT_OUI; i++)
1420		if (vendor_class->method_table[i])
1421			return 1;
1422	return 0;
1423}
1424
1425static int find_vendor_oui(struct ib_mad_mgmt_vendor_class *vendor_class,
1426			   const char *oui)
1427{
1428	int i;
1429
1430	for (i = 0; i < MAX_MGMT_OUI; i++)
1431		/* Is there matching OUI for this vendor class ? */
1432		if (!memcmp(vendor_class->oui[i], oui, 3))
1433			return i;
1434
1435	return -1;
1436}
1437
1438static int check_vendor_table(struct ib_mad_mgmt_vendor_class_table *vendor)
1439{
1440	int i;
1441
1442	for (i = 0; i < MAX_MGMT_VENDOR_RANGE2; i++)
1443		if (vendor->vendor_class[i])
1444			return 1;
1445
1446	return 0;
1447}
1448
1449static void remove_methods_mad_agent(struct ib_mad_mgmt_method_table *method,
1450				     struct ib_mad_agent_private *agent)
1451{
1452	int i;
1453
1454	/* Remove any methods for this mad agent */
1455	for (i = 0; i < IB_MGMT_MAX_METHODS; i++) {
1456		if (method->agent[i] == agent) {
1457			method->agent[i] = NULL;
1458		}
1459	}
1460}
1461
1462static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1463			      struct ib_mad_agent_private *agent_priv,
1464			      u8 mgmt_class)
1465{
1466	struct ib_mad_port_private *port_priv;
1467	struct ib_mad_mgmt_class_table **class;
1468	struct ib_mad_mgmt_method_table **method;
1469	int i, ret;
1470
1471	port_priv = agent_priv->qp_info->port_priv;
1472	class = &port_priv->version[mad_reg_req->mgmt_class_version].class;
1473	if (!*class) {
1474		/* Allocate management class table for "new" class version */
1475		*class = kzalloc(sizeof **class, GFP_ATOMIC);
1476		if (!*class) {
 
 
1477			ret = -ENOMEM;
1478			goto error1;
1479		}
1480
1481		/* Allocate method table for this management class */
1482		method = &(*class)->method_table[mgmt_class];
1483		if ((ret = allocate_method_table(method)))
1484			goto error2;
1485	} else {
1486		method = &(*class)->method_table[mgmt_class];
1487		if (!*method) {
1488			/* Allocate method table for this management class */
1489			if ((ret = allocate_method_table(method)))
1490				goto error1;
1491		}
1492	}
1493
1494	/* Now, make sure methods are not already in use */
1495	if (method_in_use(method, mad_reg_req))
1496		goto error3;
1497
1498	/* Finally, add in methods being registered */
1499	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
1500		(*method)->agent[i] = agent_priv;
1501
1502	return 0;
1503
1504error3:
1505	/* Remove any methods for this mad agent */
1506	remove_methods_mad_agent(*method, agent_priv);
1507	/* Now, check to see if there are any methods in use */
1508	if (!check_method_table(*method)) {
1509		/* If not, release management method table */
1510		kfree(*method);
1511		*method = NULL;
1512	}
1513	ret = -EINVAL;
1514	goto error1;
1515error2:
1516	kfree(*class);
1517	*class = NULL;
1518error1:
1519	return ret;
1520}
1521
1522static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1523			   struct ib_mad_agent_private *agent_priv)
1524{
1525	struct ib_mad_port_private *port_priv;
1526	struct ib_mad_mgmt_vendor_class_table **vendor_table;
1527	struct ib_mad_mgmt_vendor_class_table *vendor = NULL;
1528	struct ib_mad_mgmt_vendor_class *vendor_class = NULL;
1529	struct ib_mad_mgmt_method_table **method;
1530	int i, ret = -ENOMEM;
1531	u8 vclass;
1532
1533	/* "New" vendor (with OUI) class */
1534	vclass = vendor_class_index(mad_reg_req->mgmt_class);
1535	port_priv = agent_priv->qp_info->port_priv;
1536	vendor_table = &port_priv->version[
1537				mad_reg_req->mgmt_class_version].vendor;
1538	if (!*vendor_table) {
1539		/* Allocate mgmt vendor class table for "new" class version */
1540		vendor = kzalloc(sizeof *vendor, GFP_ATOMIC);
1541		if (!vendor)
 
 
1542			goto error1;
 
1543
1544		*vendor_table = vendor;
1545	}
1546	if (!(*vendor_table)->vendor_class[vclass]) {
1547		/* Allocate table for this management vendor class */
1548		vendor_class = kzalloc(sizeof *vendor_class, GFP_ATOMIC);
1549		if (!vendor_class)
 
 
1550			goto error2;
 
1551
1552		(*vendor_table)->vendor_class[vclass] = vendor_class;
1553	}
1554	for (i = 0; i < MAX_MGMT_OUI; i++) {
1555		/* Is there matching OUI for this vendor class ? */
1556		if (!memcmp((*vendor_table)->vendor_class[vclass]->oui[i],
1557			    mad_reg_req->oui, 3)) {
1558			method = &(*vendor_table)->vendor_class[
1559						vclass]->method_table[i];
1560			BUG_ON(!*method);
1561			goto check_in_use;
1562		}
1563	}
1564	for (i = 0; i < MAX_MGMT_OUI; i++) {
1565		/* OUI slot available ? */
1566		if (!is_vendor_oui((*vendor_table)->vendor_class[
1567				vclass]->oui[i])) {
1568			method = &(*vendor_table)->vendor_class[
1569				vclass]->method_table[i];
1570			BUG_ON(*method);
1571			/* Allocate method table for this OUI */
1572			if ((ret = allocate_method_table(method)))
1573				goto error3;
1574			memcpy((*vendor_table)->vendor_class[vclass]->oui[i],
1575			       mad_reg_req->oui, 3);
1576			goto check_in_use;
1577		}
1578	}
1579	dev_err(&agent_priv->agent.device->dev, "All OUI slots in use\n");
1580	goto error3;
1581
1582check_in_use:
1583	/* Now, make sure methods are not already in use */
1584	if (method_in_use(method, mad_reg_req))
1585		goto error4;
1586
1587	/* Finally, add in methods being registered */
1588	for_each_set_bit(i, mad_reg_req->method_mask, IB_MGMT_MAX_METHODS)
1589		(*method)->agent[i] = agent_priv;
1590
1591	return 0;
1592
1593error4:
1594	/* Remove any methods for this mad agent */
1595	remove_methods_mad_agent(*method, agent_priv);
1596	/* Now, check to see if there are any methods in use */
1597	if (!check_method_table(*method)) {
1598		/* If not, release management method table */
1599		kfree(*method);
1600		*method = NULL;
1601	}
1602	ret = -EINVAL;
1603error3:
1604	if (vendor_class) {
1605		(*vendor_table)->vendor_class[vclass] = NULL;
1606		kfree(vendor_class);
1607	}
1608error2:
1609	if (vendor) {
1610		*vendor_table = NULL;
1611		kfree(vendor);
1612	}
1613error1:
1614	return ret;
1615}
1616
1617static void remove_mad_reg_req(struct ib_mad_agent_private *agent_priv)
1618{
1619	struct ib_mad_port_private *port_priv;
1620	struct ib_mad_mgmt_class_table *class;
1621	struct ib_mad_mgmt_method_table *method;
1622	struct ib_mad_mgmt_vendor_class_table *vendor;
1623	struct ib_mad_mgmt_vendor_class *vendor_class;
1624	int index;
1625	u8 mgmt_class;
1626
1627	/*
1628	 * Was MAD registration request supplied
1629	 * with original registration ?
1630	 */
1631	if (!agent_priv->reg_req) {
1632		goto out;
1633	}
1634
1635	port_priv = agent_priv->qp_info->port_priv;
1636	mgmt_class = convert_mgmt_class(agent_priv->reg_req->mgmt_class);
1637	class = port_priv->version[
1638			agent_priv->reg_req->mgmt_class_version].class;
1639	if (!class)
1640		goto vendor_check;
1641
1642	method = class->method_table[mgmt_class];
1643	if (method) {
1644		/* Remove any methods for this mad agent */
1645		remove_methods_mad_agent(method, agent_priv);
1646		/* Now, check to see if there are any methods still in use */
1647		if (!check_method_table(method)) {
1648			/* If not, release management method table */
1649			kfree(method);
1650			class->method_table[mgmt_class] = NULL;
1651			/* Any management classes left ? */
1652			if (!check_class_table(class)) {
1653				/* If not, release management class table */
1654				kfree(class);
1655				port_priv->version[
1656					agent_priv->reg_req->
1657					mgmt_class_version].class = NULL;
1658			}
1659		}
1660	}
1661
1662vendor_check:
1663	if (!is_vendor_class(mgmt_class))
1664		goto out;
1665
1666	/* normalize mgmt_class to vendor range 2 */
1667	mgmt_class = vendor_class_index(agent_priv->reg_req->mgmt_class);
1668	vendor = port_priv->version[
1669			agent_priv->reg_req->mgmt_class_version].vendor;
1670
1671	if (!vendor)
1672		goto out;
1673
1674	vendor_class = vendor->vendor_class[mgmt_class];
1675	if (vendor_class) {
1676		index = find_vendor_oui(vendor_class, agent_priv->reg_req->oui);
1677		if (index < 0)
1678			goto out;
1679		method = vendor_class->method_table[index];
1680		if (method) {
1681			/* Remove any methods for this mad agent */
1682			remove_methods_mad_agent(method, agent_priv);
1683			/*
1684			 * Now, check to see if there are
1685			 * any methods still in use
1686			 */
1687			if (!check_method_table(method)) {
1688				/* If not, release management method table */
1689				kfree(method);
1690				vendor_class->method_table[index] = NULL;
1691				memset(vendor_class->oui[index], 0, 3);
1692				/* Any OUIs left ? */
1693				if (!check_vendor_class(vendor_class)) {
1694					/* If not, release vendor class table */
1695					kfree(vendor_class);
1696					vendor->vendor_class[mgmt_class] = NULL;
1697					/* Any other vendor classes left ? */
1698					if (!check_vendor_table(vendor)) {
1699						kfree(vendor);
1700						port_priv->version[
1701							agent_priv->reg_req->
1702							mgmt_class_version].
1703							vendor = NULL;
1704					}
1705				}
1706			}
1707		}
1708	}
1709
1710out:
1711	return;
1712}
1713
1714static struct ib_mad_agent_private *
1715find_mad_agent(struct ib_mad_port_private *port_priv,
1716	       const struct ib_mad_hdr *mad_hdr)
1717{
1718	struct ib_mad_agent_private *mad_agent = NULL;
1719	unsigned long flags;
1720
1721	spin_lock_irqsave(&port_priv->reg_lock, flags);
1722	if (ib_response_mad(mad_hdr)) {
1723		u32 hi_tid;
1724		struct ib_mad_agent_private *entry;
1725
1726		/*
1727		 * Routing is based on high 32 bits of transaction ID
1728		 * of MAD.
1729		 */
1730		hi_tid = be64_to_cpu(mad_hdr->tid) >> 32;
1731		list_for_each_entry(entry, &port_priv->agent_list, agent_list) {
1732			if (entry->agent.hi_tid == hi_tid) {
1733				mad_agent = entry;
1734				break;
1735			}
1736		}
1737	} else {
1738		struct ib_mad_mgmt_class_table *class;
1739		struct ib_mad_mgmt_method_table *method;
1740		struct ib_mad_mgmt_vendor_class_table *vendor;
1741		struct ib_mad_mgmt_vendor_class *vendor_class;
1742		const struct ib_vendor_mad *vendor_mad;
1743		int index;
1744
1745		/*
1746		 * Routing is based on version, class, and method
1747		 * For "newer" vendor MADs, also based on OUI
1748		 */
1749		if (mad_hdr->class_version >= MAX_MGMT_VERSION)
1750			goto out;
1751		if (!is_vendor_class(mad_hdr->mgmt_class)) {
1752			class = port_priv->version[
1753					mad_hdr->class_version].class;
1754			if (!class)
1755				goto out;
1756			if (convert_mgmt_class(mad_hdr->mgmt_class) >=
1757			    ARRAY_SIZE(class->method_table))
1758				goto out;
1759			method = class->method_table[convert_mgmt_class(
1760							mad_hdr->mgmt_class)];
1761			if (method)
1762				mad_agent = method->agent[mad_hdr->method &
1763							  ~IB_MGMT_METHOD_RESP];
1764		} else {
1765			vendor = port_priv->version[
1766					mad_hdr->class_version].vendor;
1767			if (!vendor)
1768				goto out;
1769			vendor_class = vendor->vendor_class[vendor_class_index(
1770						mad_hdr->mgmt_class)];
1771			if (!vendor_class)
1772				goto out;
1773			/* Find matching OUI */
1774			vendor_mad = (const struct ib_vendor_mad *)mad_hdr;
1775			index = find_vendor_oui(vendor_class, vendor_mad->oui);
1776			if (index == -1)
1777				goto out;
1778			method = vendor_class->method_table[index];
1779			if (method) {
1780				mad_agent = method->agent[mad_hdr->method &
1781							  ~IB_MGMT_METHOD_RESP];
1782			}
1783		}
1784	}
1785
1786	if (mad_agent) {
1787		if (mad_agent->agent.recv_handler)
1788			atomic_inc(&mad_agent->refcount);
1789		else {
1790			dev_notice(&port_priv->device->dev,
1791				   "No receive handler for client %p on port %d\n",
1792				   &mad_agent->agent, port_priv->port_num);
1793			mad_agent = NULL;
1794		}
1795	}
1796out:
1797	spin_unlock_irqrestore(&port_priv->reg_lock, flags);
1798
1799	return mad_agent;
1800}
1801
1802static int validate_mad(const struct ib_mad_hdr *mad_hdr,
1803			const struct ib_mad_qp_info *qp_info,
1804			bool opa)
1805{
1806	int valid = 0;
1807	u32 qp_num = qp_info->qp->qp_num;
1808
1809	/* Make sure MAD base version is understood */
1810	if (mad_hdr->base_version != IB_MGMT_BASE_VERSION &&
1811	    (!opa || mad_hdr->base_version != OPA_MGMT_BASE_VERSION)) {
1812		pr_err("MAD received with unsupported base version %d %s\n",
1813		       mad_hdr->base_version, opa ? "(opa)" : "");
1814		goto out;
1815	}
1816
1817	/* Filter SMI packets sent to other than QP0 */
1818	if ((mad_hdr->mgmt_class == IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
1819	    (mad_hdr->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
1820		if (qp_num == 0)
1821			valid = 1;
1822	} else {
1823		/* CM attributes other than ClassPortInfo only use Send method */
1824		if ((mad_hdr->mgmt_class == IB_MGMT_CLASS_CM) &&
1825		    (mad_hdr->attr_id != IB_MGMT_CLASSPORTINFO_ATTR_ID) &&
1826		    (mad_hdr->method != IB_MGMT_METHOD_SEND))
1827			goto out;
1828		/* Filter GSI packets sent to QP0 */
1829		if (qp_num != 0)
1830			valid = 1;
1831	}
1832
1833out:
1834	return valid;
1835}
1836
1837static int is_rmpp_data_mad(const struct ib_mad_agent_private *mad_agent_priv,
1838			    const struct ib_mad_hdr *mad_hdr)
1839{
1840	struct ib_rmpp_mad *rmpp_mad;
1841
1842	rmpp_mad = (struct ib_rmpp_mad *)mad_hdr;
1843	return !mad_agent_priv->agent.rmpp_version ||
1844		!ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent) ||
1845		!(ib_get_rmpp_flags(&rmpp_mad->rmpp_hdr) &
1846				    IB_MGMT_RMPP_FLAG_ACTIVE) ||
1847		(rmpp_mad->rmpp_hdr.rmpp_type == IB_MGMT_RMPP_TYPE_DATA);
1848}
1849
1850static inline int rcv_has_same_class(const struct ib_mad_send_wr_private *wr,
1851				     const struct ib_mad_recv_wc *rwc)
1852{
1853	return ((struct ib_mad_hdr *)(wr->send_buf.mad))->mgmt_class ==
1854		rwc->recv_buf.mad->mad_hdr.mgmt_class;
1855}
1856
1857static inline int rcv_has_same_gid(const struct ib_mad_agent_private *mad_agent_priv,
1858				   const struct ib_mad_send_wr_private *wr,
1859				   const struct ib_mad_recv_wc *rwc )
1860{
1861	struct rdma_ah_attr attr;
1862	u8 send_resp, rcv_resp;
1863	union ib_gid sgid;
1864	struct ib_device *device = mad_agent_priv->agent.device;
1865	u8 port_num = mad_agent_priv->agent.port_num;
1866	u8 lmc;
1867	bool has_grh;
1868
1869	send_resp = ib_response_mad((struct ib_mad_hdr *)wr->send_buf.mad);
1870	rcv_resp = ib_response_mad(&rwc->recv_buf.mad->mad_hdr);
1871
1872	if (send_resp == rcv_resp)
1873		/* both requests, or both responses. GIDs different */
1874		return 0;
1875
1876	if (rdma_query_ah(wr->send_buf.ah, &attr))
1877		/* Assume not equal, to avoid false positives. */
1878		return 0;
1879
1880	has_grh = !!(rdma_ah_get_ah_flags(&attr) & IB_AH_GRH);
1881	if (has_grh != !!(rwc->wc->wc_flags & IB_WC_GRH))
1882		/* one has GID, other does not.  Assume different */
1883		return 0;
1884
1885	if (!send_resp && rcv_resp) {
1886		/* is request/response. */
1887		if (!has_grh) {
1888			if (ib_get_cached_lmc(device, port_num, &lmc))
1889				return 0;
1890			return (!lmc || !((rdma_ah_get_path_bits(&attr) ^
1891					   rwc->wc->dlid_path_bits) &
1892					  ((1 << lmc) - 1)));
1893		} else {
1894			const struct ib_global_route *grh =
1895					rdma_ah_read_grh(&attr);
1896
1897			if (ib_get_cached_gid(device, port_num,
1898					      grh->sgid_index, &sgid, NULL))
1899				return 0;
1900			return !memcmp(sgid.raw, rwc->recv_buf.grh->dgid.raw,
1901				       16);
1902		}
1903	}
1904
1905	if (!has_grh)
1906		return rdma_ah_get_dlid(&attr) == rwc->wc->slid;
1907	else
1908		return !memcmp(rdma_ah_read_grh(&attr)->dgid.raw,
1909			       rwc->recv_buf.grh->sgid.raw,
1910			       16);
1911}
1912
1913static inline int is_direct(u8 class)
1914{
1915	return (class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE);
1916}
1917
1918struct ib_mad_send_wr_private*
1919ib_find_send_mad(const struct ib_mad_agent_private *mad_agent_priv,
1920		 const struct ib_mad_recv_wc *wc)
1921{
1922	struct ib_mad_send_wr_private *wr;
1923	const struct ib_mad_hdr *mad_hdr;
1924
1925	mad_hdr = &wc->recv_buf.mad->mad_hdr;
1926
1927	list_for_each_entry(wr, &mad_agent_priv->wait_list, agent_list) {
1928		if ((wr->tid == mad_hdr->tid) &&
1929		    rcv_has_same_class(wr, wc) &&
1930		    /*
1931		     * Don't check GID for direct routed MADs.
1932		     * These might have permissive LIDs.
1933		     */
1934		    (is_direct(mad_hdr->mgmt_class) ||
1935		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1936			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1937	}
1938
1939	/*
1940	 * It's possible to receive the response before we've
1941	 * been notified that the send has completed
1942	 */
1943	list_for_each_entry(wr, &mad_agent_priv->send_list, agent_list) {
1944		if (is_rmpp_data_mad(mad_agent_priv, wr->send_buf.mad) &&
1945		    wr->tid == mad_hdr->tid &&
1946		    wr->timeout &&
1947		    rcv_has_same_class(wr, wc) &&
1948		    /*
1949		     * Don't check GID for direct routed MADs.
1950		     * These might have permissive LIDs.
1951		     */
1952		    (is_direct(mad_hdr->mgmt_class) ||
1953		     rcv_has_same_gid(mad_agent_priv, wr, wc)))
1954			/* Verify request has not been canceled */
1955			return (wr->status == IB_WC_SUCCESS) ? wr : NULL;
1956	}
1957	return NULL;
1958}
1959
1960void ib_mark_mad_done(struct ib_mad_send_wr_private *mad_send_wr)
1961{
1962	mad_send_wr->timeout = 0;
1963	if (mad_send_wr->refcount == 1)
1964		list_move_tail(&mad_send_wr->agent_list,
1965			      &mad_send_wr->mad_agent_priv->done_list);
1966}
1967
1968static void ib_mad_complete_recv(struct ib_mad_agent_private *mad_agent_priv,
1969				 struct ib_mad_recv_wc *mad_recv_wc)
1970{
1971	struct ib_mad_send_wr_private *mad_send_wr;
1972	struct ib_mad_send_wc mad_send_wc;
1973	unsigned long flags;
1974	int ret;
1975
1976	INIT_LIST_HEAD(&mad_recv_wc->rmpp_list);
1977	ret = ib_mad_enforce_security(mad_agent_priv,
1978				      mad_recv_wc->wc->pkey_index);
1979	if (ret) {
1980		ib_free_recv_mad(mad_recv_wc);
1981		deref_mad_agent(mad_agent_priv);
1982		return;
1983	}
1984
1985	list_add(&mad_recv_wc->recv_buf.list, &mad_recv_wc->rmpp_list);
1986	if (ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)) {
1987		mad_recv_wc = ib_process_rmpp_recv_wc(mad_agent_priv,
1988						      mad_recv_wc);
1989		if (!mad_recv_wc) {
1990			deref_mad_agent(mad_agent_priv);
1991			return;
1992		}
1993	}
1994
1995	/* Complete corresponding request */
1996	if (ib_response_mad(&mad_recv_wc->recv_buf.mad->mad_hdr)) {
1997		spin_lock_irqsave(&mad_agent_priv->lock, flags);
1998		mad_send_wr = ib_find_send_mad(mad_agent_priv, mad_recv_wc);
1999		if (!mad_send_wr) {
2000			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2001			if (!ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)
2002			   && ib_is_mad_class_rmpp(mad_recv_wc->recv_buf.mad->mad_hdr.mgmt_class)
2003			   && (ib_get_rmpp_flags(&((struct ib_rmpp_mad *)mad_recv_wc->recv_buf.mad)->rmpp_hdr)
2004					& IB_MGMT_RMPP_FLAG_ACTIVE)) {
2005				/* user rmpp is in effect
2006				 * and this is an active RMPP MAD
2007				 */
2008				mad_agent_priv->agent.recv_handler(
2009						&mad_agent_priv->agent, NULL,
2010						mad_recv_wc);
2011				atomic_dec(&mad_agent_priv->refcount);
2012			} else {
2013				/* not user rmpp, revert to normal behavior and
2014				 * drop the mad */
2015				ib_free_recv_mad(mad_recv_wc);
2016				deref_mad_agent(mad_agent_priv);
2017				return;
2018			}
2019		} else {
2020			ib_mark_mad_done(mad_send_wr);
2021			spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2022
2023			/* Defined behavior is to complete response before request */
2024			mad_agent_priv->agent.recv_handler(
2025					&mad_agent_priv->agent,
2026					&mad_send_wr->send_buf,
2027					mad_recv_wc);
2028			atomic_dec(&mad_agent_priv->refcount);
2029
2030			mad_send_wc.status = IB_WC_SUCCESS;
2031			mad_send_wc.vendor_err = 0;
2032			mad_send_wc.send_buf = &mad_send_wr->send_buf;
2033			ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
2034		}
2035	} else {
2036		mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent, NULL,
2037						   mad_recv_wc);
2038		deref_mad_agent(mad_agent_priv);
2039	}
2040
2041	return;
2042}
2043
2044static enum smi_action handle_ib_smi(const struct ib_mad_port_private *port_priv,
2045				     const struct ib_mad_qp_info *qp_info,
2046				     const struct ib_wc *wc,
2047				     int port_num,
2048				     struct ib_mad_private *recv,
2049				     struct ib_mad_private *response)
2050{
2051	enum smi_forward_action retsmi;
2052	struct ib_smp *smp = (struct ib_smp *)recv->mad;
2053
2054	if (smi_handle_dr_smp_recv(smp,
2055				   rdma_cap_ib_switch(port_priv->device),
2056				   port_num,
2057				   port_priv->device->phys_port_cnt) ==
2058				   IB_SMI_DISCARD)
2059		return IB_SMI_DISCARD;
2060
2061	retsmi = smi_check_forward_dr_smp(smp);
2062	if (retsmi == IB_SMI_LOCAL)
2063		return IB_SMI_HANDLE;
2064
2065	if (retsmi == IB_SMI_SEND) { /* don't forward */
2066		if (smi_handle_dr_smp_send(smp,
2067					   rdma_cap_ib_switch(port_priv->device),
2068					   port_num) == IB_SMI_DISCARD)
2069			return IB_SMI_DISCARD;
2070
2071		if (smi_check_local_smp(smp, port_priv->device) == IB_SMI_DISCARD)
2072			return IB_SMI_DISCARD;
2073	} else if (rdma_cap_ib_switch(port_priv->device)) {
2074		/* forward case for switches */
2075		memcpy(response, recv, mad_priv_size(response));
2076		response->header.recv_wc.wc = &response->header.wc;
2077		response->header.recv_wc.recv_buf.mad = (struct ib_mad *)response->mad;
2078		response->header.recv_wc.recv_buf.grh = &response->grh;
2079
2080		agent_send_response((const struct ib_mad_hdr *)response->mad,
2081				    &response->grh, wc,
2082				    port_priv->device,
2083				    smi_get_fwd_port(smp),
2084				    qp_info->qp->qp_num,
2085				    response->mad_size,
2086				    false);
2087
2088		return IB_SMI_DISCARD;
2089	}
2090	return IB_SMI_HANDLE;
2091}
2092
2093static bool generate_unmatched_resp(const struct ib_mad_private *recv,
2094				    struct ib_mad_private *response,
2095				    size_t *resp_len, bool opa)
2096{
2097	const struct ib_mad_hdr *recv_hdr = (const struct ib_mad_hdr *)recv->mad;
2098	struct ib_mad_hdr *resp_hdr = (struct ib_mad_hdr *)response->mad;
2099
2100	if (recv_hdr->method == IB_MGMT_METHOD_GET ||
2101	    recv_hdr->method == IB_MGMT_METHOD_SET) {
2102		memcpy(response, recv, mad_priv_size(response));
2103		response->header.recv_wc.wc = &response->header.wc;
2104		response->header.recv_wc.recv_buf.mad = (struct ib_mad *)response->mad;
2105		response->header.recv_wc.recv_buf.grh = &response->grh;
2106		resp_hdr->method = IB_MGMT_METHOD_GET_RESP;
2107		resp_hdr->status = cpu_to_be16(IB_MGMT_MAD_STATUS_UNSUPPORTED_METHOD_ATTRIB);
2108		if (recv_hdr->mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
2109			resp_hdr->status |= IB_SMP_DIRECTION;
2110
2111		if (opa && recv_hdr->base_version == OPA_MGMT_BASE_VERSION) {
2112			if (recv_hdr->mgmt_class ==
2113			    IB_MGMT_CLASS_SUBN_LID_ROUTED ||
2114			    recv_hdr->mgmt_class ==
2115			    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
2116				*resp_len = opa_get_smp_header_size(
2117							(struct opa_smp *)recv->mad);
2118			else
2119				*resp_len = sizeof(struct ib_mad_hdr);
2120		}
2121
2122		return true;
2123	} else {
2124		return false;
2125	}
2126}
2127
2128static enum smi_action
2129handle_opa_smi(struct ib_mad_port_private *port_priv,
2130	       struct ib_mad_qp_info *qp_info,
2131	       struct ib_wc *wc,
2132	       int port_num,
2133	       struct ib_mad_private *recv,
2134	       struct ib_mad_private *response)
2135{
2136	enum smi_forward_action retsmi;
2137	struct opa_smp *smp = (struct opa_smp *)recv->mad;
2138
2139	if (opa_smi_handle_dr_smp_recv(smp,
2140				   rdma_cap_ib_switch(port_priv->device),
2141				   port_num,
2142				   port_priv->device->phys_port_cnt) ==
2143				   IB_SMI_DISCARD)
2144		return IB_SMI_DISCARD;
2145
2146	retsmi = opa_smi_check_forward_dr_smp(smp);
2147	if (retsmi == IB_SMI_LOCAL)
2148		return IB_SMI_HANDLE;
2149
2150	if (retsmi == IB_SMI_SEND) { /* don't forward */
2151		if (opa_smi_handle_dr_smp_send(smp,
2152					   rdma_cap_ib_switch(port_priv->device),
2153					   port_num) == IB_SMI_DISCARD)
2154			return IB_SMI_DISCARD;
2155
2156		if (opa_smi_check_local_smp(smp, port_priv->device) ==
2157		    IB_SMI_DISCARD)
2158			return IB_SMI_DISCARD;
2159
2160	} else if (rdma_cap_ib_switch(port_priv->device)) {
2161		/* forward case for switches */
2162		memcpy(response, recv, mad_priv_size(response));
2163		response->header.recv_wc.wc = &response->header.wc;
2164		response->header.recv_wc.recv_buf.opa_mad =
2165				(struct opa_mad *)response->mad;
2166		response->header.recv_wc.recv_buf.grh = &response->grh;
2167
2168		agent_send_response((const struct ib_mad_hdr *)response->mad,
2169				    &response->grh, wc,
2170				    port_priv->device,
2171				    opa_smi_get_fwd_port(smp),
2172				    qp_info->qp->qp_num,
2173				    recv->header.wc.byte_len,
2174				    true);
2175
2176		return IB_SMI_DISCARD;
2177	}
2178
2179	return IB_SMI_HANDLE;
2180}
2181
2182static enum smi_action
2183handle_smi(struct ib_mad_port_private *port_priv,
2184	   struct ib_mad_qp_info *qp_info,
2185	   struct ib_wc *wc,
2186	   int port_num,
2187	   struct ib_mad_private *recv,
2188	   struct ib_mad_private *response,
2189	   bool opa)
2190{
2191	struct ib_mad_hdr *mad_hdr = (struct ib_mad_hdr *)recv->mad;
2192
2193	if (opa && mad_hdr->base_version == OPA_MGMT_BASE_VERSION &&
2194	    mad_hdr->class_version == OPA_SM_CLASS_VERSION)
2195		return handle_opa_smi(port_priv, qp_info, wc, port_num, recv,
2196				      response);
2197
2198	return handle_ib_smi(port_priv, qp_info, wc, port_num, recv, response);
2199}
2200
2201static void ib_mad_recv_done(struct ib_cq *cq, struct ib_wc *wc)
2202{
2203	struct ib_mad_port_private *port_priv = cq->cq_context;
2204	struct ib_mad_list_head *mad_list =
2205		container_of(wc->wr_cqe, struct ib_mad_list_head, cqe);
2206	struct ib_mad_qp_info *qp_info;
2207	struct ib_mad_private_header *mad_priv_hdr;
2208	struct ib_mad_private *recv, *response = NULL;
 
2209	struct ib_mad_agent_private *mad_agent;
2210	int port_num;
2211	int ret = IB_MAD_RESULT_SUCCESS;
2212	size_t mad_size;
2213	u16 resp_mad_pkey_index = 0;
2214	bool opa;
2215
2216	if (list_empty_careful(&port_priv->port_list))
2217		return;
2218
2219	if (wc->status != IB_WC_SUCCESS) {
2220		/*
2221		 * Receive errors indicate that the QP has entered the error
2222		 * state - error handling/shutdown code will cleanup
2223		 */
2224		return;
2225	}
2226
 
2227	qp_info = mad_list->mad_queue->qp_info;
2228	dequeue_mad(mad_list);
2229
2230	opa = rdma_cap_opa_mad(qp_info->port_priv->device,
2231			       qp_info->port_priv->port_num);
2232
2233	mad_priv_hdr = container_of(mad_list, struct ib_mad_private_header,
2234				    mad_list);
2235	recv = container_of(mad_priv_hdr, struct ib_mad_private, header);
2236	ib_dma_unmap_single(port_priv->device,
2237			    recv->header.mapping,
2238			    mad_priv_dma_size(recv),
 
2239			    DMA_FROM_DEVICE);
2240
2241	/* Setup MAD receive work completion from "normal" work completion */
2242	recv->header.wc = *wc;
2243	recv->header.recv_wc.wc = &recv->header.wc;
2244
2245	if (opa && ((struct ib_mad_hdr *)(recv->mad))->base_version == OPA_MGMT_BASE_VERSION) {
2246		recv->header.recv_wc.mad_len = wc->byte_len - sizeof(struct ib_grh);
2247		recv->header.recv_wc.mad_seg_size = sizeof(struct opa_mad);
2248	} else {
2249		recv->header.recv_wc.mad_len = sizeof(struct ib_mad);
2250		recv->header.recv_wc.mad_seg_size = sizeof(struct ib_mad);
2251	}
2252
2253	recv->header.recv_wc.recv_buf.mad = (struct ib_mad *)recv->mad;
2254	recv->header.recv_wc.recv_buf.grh = &recv->grh;
2255
2256	if (atomic_read(&qp_info->snoop_count))
2257		snoop_recv(qp_info, &recv->header.recv_wc, IB_MAD_SNOOP_RECVS);
2258
2259	/* Validate MAD */
2260	if (!validate_mad((const struct ib_mad_hdr *)recv->mad, qp_info, opa))
2261		goto out;
2262
2263	mad_size = recv->mad_size;
2264	response = alloc_mad_private(mad_size, GFP_KERNEL);
2265	if (!response)
 
2266		goto out;
 
2267
2268	if (rdma_cap_ib_switch(port_priv->device))
2269		port_num = wc->port_num;
2270	else
2271		port_num = port_priv->port_num;
2272
2273	if (((struct ib_mad_hdr *)recv->mad)->mgmt_class ==
2274	    IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
2275		if (handle_smi(port_priv, qp_info, wc, port_num, recv,
2276			       response, opa)
2277		    == IB_SMI_DISCARD)
 
 
 
 
2278			goto out;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2279	}
2280
 
2281	/* Give driver "right of first refusal" on incoming MAD */
2282	if (port_priv->device->process_mad) {
 
 
2283		ret = port_priv->device->process_mad(port_priv->device, 0,
2284						     port_priv->port_num,
2285						     wc, &recv->grh,
2286						     (const struct ib_mad_hdr *)recv->mad,
2287						     recv->mad_size,
2288						     (struct ib_mad_hdr *)response->mad,
2289						     &mad_size, &resp_mad_pkey_index);
2290
2291		if (opa)
2292			wc->pkey_index = resp_mad_pkey_index;
2293
2294		if (ret & IB_MAD_RESULT_SUCCESS) {
2295			if (ret & IB_MAD_RESULT_CONSUMED)
2296				goto out;
2297			if (ret & IB_MAD_RESULT_REPLY) {
2298				agent_send_response((const struct ib_mad_hdr *)response->mad,
2299						    &recv->grh, wc,
2300						    port_priv->device,
2301						    port_num,
2302						    qp_info->qp->qp_num,
2303						    mad_size, opa);
2304				goto out;
2305			}
2306		}
2307	}
2308
2309	mad_agent = find_mad_agent(port_priv, (const struct ib_mad_hdr *)recv->mad);
2310	if (mad_agent) {
2311		ib_mad_complete_recv(mad_agent, &recv->header.recv_wc);
2312		/*
2313		 * recv is freed up in error cases in ib_mad_complete_recv
2314		 * or via recv_handler in ib_mad_complete_recv()
2315		 */
2316		recv = NULL;
2317	} else if ((ret & IB_MAD_RESULT_SUCCESS) &&
2318		   generate_unmatched_resp(recv, response, &mad_size, opa)) {
2319		agent_send_response((const struct ib_mad_hdr *)response->mad, &recv->grh, wc,
2320				    port_priv->device, port_num,
2321				    qp_info->qp->qp_num, mad_size, opa);
2322	}
2323
2324out:
2325	/* Post another receive request for this QP */
2326	if (response) {
2327		ib_mad_post_receive_mads(qp_info, response);
2328		kfree(recv);
 
2329	} else
2330		ib_mad_post_receive_mads(qp_info, recv);
2331}
2332
2333static void adjust_timeout(struct ib_mad_agent_private *mad_agent_priv)
2334{
2335	struct ib_mad_send_wr_private *mad_send_wr;
2336	unsigned long delay;
2337
2338	if (list_empty(&mad_agent_priv->wait_list)) {
2339		cancel_delayed_work(&mad_agent_priv->timed_work);
2340	} else {
2341		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2342					 struct ib_mad_send_wr_private,
2343					 agent_list);
2344
2345		if (time_after(mad_agent_priv->timeout,
2346			       mad_send_wr->timeout)) {
2347			mad_agent_priv->timeout = mad_send_wr->timeout;
 
2348			delay = mad_send_wr->timeout - jiffies;
2349			if ((long)delay <= 0)
2350				delay = 1;
2351			mod_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
2352					 &mad_agent_priv->timed_work, delay);
 
2353		}
2354	}
2355}
2356
2357static void wait_for_response(struct ib_mad_send_wr_private *mad_send_wr)
2358{
2359	struct ib_mad_agent_private *mad_agent_priv;
2360	struct ib_mad_send_wr_private *temp_mad_send_wr;
2361	struct list_head *list_item;
2362	unsigned long delay;
2363
2364	mad_agent_priv = mad_send_wr->mad_agent_priv;
2365	list_del(&mad_send_wr->agent_list);
2366
2367	delay = mad_send_wr->timeout;
2368	mad_send_wr->timeout += jiffies;
2369
2370	if (delay) {
2371		list_for_each_prev(list_item, &mad_agent_priv->wait_list) {
2372			temp_mad_send_wr = list_entry(list_item,
2373						struct ib_mad_send_wr_private,
2374						agent_list);
2375			if (time_after(mad_send_wr->timeout,
2376				       temp_mad_send_wr->timeout))
2377				break;
2378		}
2379	}
2380	else
2381		list_item = &mad_agent_priv->wait_list;
2382	list_add(&mad_send_wr->agent_list, list_item);
2383
2384	/* Reschedule a work item if we have a shorter timeout */
2385	if (mad_agent_priv->wait_list.next == &mad_send_wr->agent_list)
2386		mod_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
2387				 &mad_agent_priv->timed_work, delay);
 
 
2388}
2389
2390void ib_reset_mad_timeout(struct ib_mad_send_wr_private *mad_send_wr,
2391			  int timeout_ms)
2392{
2393	mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2394	wait_for_response(mad_send_wr);
2395}
2396
2397/*
2398 * Process a send work completion
2399 */
2400void ib_mad_complete_send_wr(struct ib_mad_send_wr_private *mad_send_wr,
2401			     struct ib_mad_send_wc *mad_send_wc)
2402{
2403	struct ib_mad_agent_private	*mad_agent_priv;
2404	unsigned long			flags;
2405	int				ret;
2406
2407	mad_agent_priv = mad_send_wr->mad_agent_priv;
2408	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2409	if (ib_mad_kernel_rmpp_agent(&mad_agent_priv->agent)) {
2410		ret = ib_process_rmpp_send_wc(mad_send_wr, mad_send_wc);
2411		if (ret == IB_RMPP_RESULT_CONSUMED)
2412			goto done;
2413	} else
2414		ret = IB_RMPP_RESULT_UNHANDLED;
2415
2416	if (mad_send_wc->status != IB_WC_SUCCESS &&
2417	    mad_send_wr->status == IB_WC_SUCCESS) {
2418		mad_send_wr->status = mad_send_wc->status;
2419		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2420	}
2421
2422	if (--mad_send_wr->refcount > 0) {
2423		if (mad_send_wr->refcount == 1 && mad_send_wr->timeout &&
2424		    mad_send_wr->status == IB_WC_SUCCESS) {
2425			wait_for_response(mad_send_wr);
2426		}
2427		goto done;
2428	}
2429
2430	/* Remove send from MAD agent and notify client of completion */
2431	list_del(&mad_send_wr->agent_list);
2432	adjust_timeout(mad_agent_priv);
2433	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2434
2435	if (mad_send_wr->status != IB_WC_SUCCESS )
2436		mad_send_wc->status = mad_send_wr->status;
2437	if (ret == IB_RMPP_RESULT_INTERNAL)
2438		ib_rmpp_send_handler(mad_send_wc);
2439	else
2440		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2441						   mad_send_wc);
2442
2443	/* Release reference on agent taken when sending */
2444	deref_mad_agent(mad_agent_priv);
2445	return;
2446done:
2447	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2448}
2449
2450static void ib_mad_send_done(struct ib_cq *cq, struct ib_wc *wc)
 
2451{
2452	struct ib_mad_port_private *port_priv = cq->cq_context;
2453	struct ib_mad_list_head *mad_list =
2454		container_of(wc->wr_cqe, struct ib_mad_list_head, cqe);
2455	struct ib_mad_send_wr_private	*mad_send_wr, *queued_send_wr;
 
2456	struct ib_mad_qp_info		*qp_info;
2457	struct ib_mad_queue		*send_queue;
2458	struct ib_send_wr		*bad_send_wr;
2459	struct ib_mad_send_wc		mad_send_wc;
2460	unsigned long flags;
2461	int ret;
2462
2463	if (list_empty_careful(&port_priv->port_list))
2464		return;
2465
2466	if (wc->status != IB_WC_SUCCESS) {
2467		if (!ib_mad_send_error(port_priv, wc))
2468			return;
2469	}
2470
2471	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2472				   mad_list);
2473	send_queue = mad_list->mad_queue;
2474	qp_info = send_queue->qp_info;
2475
2476retry:
2477	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2478			    mad_send_wr->header_mapping,
2479			    mad_send_wr->sg_list[0].length, DMA_TO_DEVICE);
2480	ib_dma_unmap_single(mad_send_wr->send_buf.mad_agent->device,
2481			    mad_send_wr->payload_mapping,
2482			    mad_send_wr->sg_list[1].length, DMA_TO_DEVICE);
2483	queued_send_wr = NULL;
2484	spin_lock_irqsave(&send_queue->lock, flags);
2485	list_del(&mad_list->list);
2486
2487	/* Move queued send to the send queue */
2488	if (send_queue->count-- > send_queue->max_active) {
2489		mad_list = container_of(qp_info->overflow_list.next,
2490					struct ib_mad_list_head, list);
2491		queued_send_wr = container_of(mad_list,
2492					struct ib_mad_send_wr_private,
2493					mad_list);
2494		list_move_tail(&mad_list->list, &send_queue->list);
2495	}
2496	spin_unlock_irqrestore(&send_queue->lock, flags);
2497
2498	mad_send_wc.send_buf = &mad_send_wr->send_buf;
2499	mad_send_wc.status = wc->status;
2500	mad_send_wc.vendor_err = wc->vendor_err;
2501	if (atomic_read(&qp_info->snoop_count))
2502		snoop_send(qp_info, &mad_send_wr->send_buf, &mad_send_wc,
2503			   IB_MAD_SNOOP_SEND_COMPLETIONS);
2504	ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
2505
2506	if (queued_send_wr) {
2507		ret = ib_post_send(qp_info->qp, &queued_send_wr->send_wr.wr,
2508				   &bad_send_wr);
2509		if (ret) {
2510			dev_err(&port_priv->device->dev,
2511				"ib_post_send failed: %d\n", ret);
2512			mad_send_wr = queued_send_wr;
2513			wc->status = IB_WC_LOC_QP_OP_ERR;
2514			goto retry;
2515		}
2516	}
2517}
2518
2519static void mark_sends_for_retry(struct ib_mad_qp_info *qp_info)
2520{
2521	struct ib_mad_send_wr_private *mad_send_wr;
2522	struct ib_mad_list_head *mad_list;
2523	unsigned long flags;
2524
2525	spin_lock_irqsave(&qp_info->send_queue.lock, flags);
2526	list_for_each_entry(mad_list, &qp_info->send_queue.list, list) {
2527		mad_send_wr = container_of(mad_list,
2528					   struct ib_mad_send_wr_private,
2529					   mad_list);
2530		mad_send_wr->retry = 1;
2531	}
2532	spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
2533}
2534
2535static bool ib_mad_send_error(struct ib_mad_port_private *port_priv,
2536		struct ib_wc *wc)
2537{
2538	struct ib_mad_list_head *mad_list =
2539		container_of(wc->wr_cqe, struct ib_mad_list_head, cqe);
2540	struct ib_mad_qp_info *qp_info = mad_list->mad_queue->qp_info;
2541	struct ib_mad_send_wr_private *mad_send_wr;
2542	int ret;
2543
 
 
 
 
 
 
 
 
 
 
2544	/*
2545	 * Send errors will transition the QP to SQE - move
2546	 * QP to RTS and repost flushed work requests
2547	 */
2548	mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2549				   mad_list);
2550	if (wc->status == IB_WC_WR_FLUSH_ERR) {
2551		if (mad_send_wr->retry) {
2552			/* Repost send */
2553			struct ib_send_wr *bad_send_wr;
2554
2555			mad_send_wr->retry = 0;
2556			ret = ib_post_send(qp_info->qp, &mad_send_wr->send_wr.wr,
2557					&bad_send_wr);
2558			if (!ret)
2559				return false;
2560		}
 
2561	} else {
2562		struct ib_qp_attr *attr;
2563
2564		/* Transition QP to RTS and fail offending send */
2565		attr = kmalloc(sizeof *attr, GFP_KERNEL);
2566		if (attr) {
2567			attr->qp_state = IB_QPS_RTS;
2568			attr->cur_qp_state = IB_QPS_SQE;
2569			ret = ib_modify_qp(qp_info->qp, attr,
2570					   IB_QP_STATE | IB_QP_CUR_STATE);
2571			kfree(attr);
2572			if (ret)
2573				dev_err(&port_priv->device->dev,
2574					"%s - ib_modify_qp to RTS: %d\n",
2575					__func__, ret);
2576			else
2577				mark_sends_for_retry(qp_info);
2578		}
 
2579	}
 
2580
2581	return true;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2582}
2583
2584static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv)
2585{
2586	unsigned long flags;
2587	struct ib_mad_send_wr_private *mad_send_wr, *temp_mad_send_wr;
2588	struct ib_mad_send_wc mad_send_wc;
2589	struct list_head cancel_list;
2590
2591	INIT_LIST_HEAD(&cancel_list);
2592
2593	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2594	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2595				 &mad_agent_priv->send_list, agent_list) {
2596		if (mad_send_wr->status == IB_WC_SUCCESS) {
2597			mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2598			mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2599		}
2600	}
2601
2602	/* Empty wait list to prevent receives from finding a request */
2603	list_splice_init(&mad_agent_priv->wait_list, &cancel_list);
2604	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2605
2606	/* Report all cancelled requests */
2607	mad_send_wc.status = IB_WC_WR_FLUSH_ERR;
2608	mad_send_wc.vendor_err = 0;
2609
2610	list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2611				 &cancel_list, agent_list) {
2612		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2613		list_del(&mad_send_wr->agent_list);
2614		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2615						   &mad_send_wc);
2616		atomic_dec(&mad_agent_priv->refcount);
2617	}
2618}
2619
2620static struct ib_mad_send_wr_private*
2621find_send_wr(struct ib_mad_agent_private *mad_agent_priv,
2622	     struct ib_mad_send_buf *send_buf)
2623{
2624	struct ib_mad_send_wr_private *mad_send_wr;
2625
2626	list_for_each_entry(mad_send_wr, &mad_agent_priv->wait_list,
2627			    agent_list) {
2628		if (&mad_send_wr->send_buf == send_buf)
2629			return mad_send_wr;
2630	}
2631
2632	list_for_each_entry(mad_send_wr, &mad_agent_priv->send_list,
2633			    agent_list) {
2634		if (is_rmpp_data_mad(mad_agent_priv,
2635				     mad_send_wr->send_buf.mad) &&
2636		    &mad_send_wr->send_buf == send_buf)
2637			return mad_send_wr;
2638	}
2639	return NULL;
2640}
2641
2642int ib_modify_mad(struct ib_mad_agent *mad_agent,
2643		  struct ib_mad_send_buf *send_buf, u32 timeout_ms)
2644{
2645	struct ib_mad_agent_private *mad_agent_priv;
2646	struct ib_mad_send_wr_private *mad_send_wr;
2647	unsigned long flags;
2648	int active;
2649
2650	mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
2651				      agent);
2652	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2653	mad_send_wr = find_send_wr(mad_agent_priv, send_buf);
2654	if (!mad_send_wr || mad_send_wr->status != IB_WC_SUCCESS) {
2655		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2656		return -EINVAL;
2657	}
2658
2659	active = (!mad_send_wr->timeout || mad_send_wr->refcount > 1);
2660	if (!timeout_ms) {
2661		mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2662		mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2663	}
2664
2665	mad_send_wr->send_buf.timeout_ms = timeout_ms;
2666	if (active)
2667		mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2668	else
2669		ib_reset_mad_timeout(mad_send_wr, timeout_ms);
2670
2671	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2672	return 0;
2673}
2674EXPORT_SYMBOL(ib_modify_mad);
2675
2676void ib_cancel_mad(struct ib_mad_agent *mad_agent,
2677		   struct ib_mad_send_buf *send_buf)
2678{
2679	ib_modify_mad(mad_agent, send_buf, 0);
2680}
2681EXPORT_SYMBOL(ib_cancel_mad);
2682
2683static void local_completions(struct work_struct *work)
2684{
2685	struct ib_mad_agent_private *mad_agent_priv;
2686	struct ib_mad_local_private *local;
2687	struct ib_mad_agent_private *recv_mad_agent;
2688	unsigned long flags;
2689	int free_mad;
2690	struct ib_wc wc;
2691	struct ib_mad_send_wc mad_send_wc;
2692	bool opa;
2693
2694	mad_agent_priv =
2695		container_of(work, struct ib_mad_agent_private, local_work);
2696
2697	opa = rdma_cap_opa_mad(mad_agent_priv->qp_info->port_priv->device,
2698			       mad_agent_priv->qp_info->port_priv->port_num);
2699
2700	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2701	while (!list_empty(&mad_agent_priv->local_list)) {
2702		local = list_entry(mad_agent_priv->local_list.next,
2703				   struct ib_mad_local_private,
2704				   completion_list);
2705		list_del(&local->completion_list);
2706		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2707		free_mad = 0;
2708		if (local->mad_priv) {
2709			u8 base_version;
2710			recv_mad_agent = local->recv_mad_agent;
2711			if (!recv_mad_agent) {
2712				dev_err(&mad_agent_priv->agent.device->dev,
2713					"No receive MAD agent for local completion\n");
2714				free_mad = 1;
2715				goto local_send_completion;
2716			}
2717
2718			/*
2719			 * Defined behavior is to complete response
2720			 * before request
2721			 */
2722			build_smp_wc(recv_mad_agent->agent.qp,
2723				     local->mad_send_wr->send_wr.wr.wr_cqe,
2724				     be16_to_cpu(IB_LID_PERMISSIVE),
2725				     local->mad_send_wr->send_wr.pkey_index,
2726				     recv_mad_agent->agent.port_num, &wc);
2727
2728			local->mad_priv->header.recv_wc.wc = &wc;
2729
2730			base_version = ((struct ib_mad_hdr *)(local->mad_priv->mad))->base_version;
2731			if (opa && base_version == OPA_MGMT_BASE_VERSION) {
2732				local->mad_priv->header.recv_wc.mad_len = local->return_wc_byte_len;
2733				local->mad_priv->header.recv_wc.mad_seg_size = sizeof(struct opa_mad);
2734			} else {
2735				local->mad_priv->header.recv_wc.mad_len = sizeof(struct ib_mad);
2736				local->mad_priv->header.recv_wc.mad_seg_size = sizeof(struct ib_mad);
2737			}
2738
2739			INIT_LIST_HEAD(&local->mad_priv->header.recv_wc.rmpp_list);
2740			list_add(&local->mad_priv->header.recv_wc.recv_buf.list,
2741				 &local->mad_priv->header.recv_wc.rmpp_list);
2742			local->mad_priv->header.recv_wc.recv_buf.grh = NULL;
2743			local->mad_priv->header.recv_wc.recv_buf.mad =
2744						(struct ib_mad *)local->mad_priv->mad;
2745			if (atomic_read(&recv_mad_agent->qp_info->snoop_count))
2746				snoop_recv(recv_mad_agent->qp_info,
2747					  &local->mad_priv->header.recv_wc,
2748					   IB_MAD_SNOOP_RECVS);
2749			recv_mad_agent->agent.recv_handler(
2750						&recv_mad_agent->agent,
2751						&local->mad_send_wr->send_buf,
2752						&local->mad_priv->header.recv_wc);
2753			spin_lock_irqsave(&recv_mad_agent->lock, flags);
2754			atomic_dec(&recv_mad_agent->refcount);
2755			spin_unlock_irqrestore(&recv_mad_agent->lock, flags);
2756		}
2757
2758local_send_completion:
2759		/* Complete send */
2760		mad_send_wc.status = IB_WC_SUCCESS;
2761		mad_send_wc.vendor_err = 0;
2762		mad_send_wc.send_buf = &local->mad_send_wr->send_buf;
2763		if (atomic_read(&mad_agent_priv->qp_info->snoop_count))
2764			snoop_send(mad_agent_priv->qp_info,
2765				   &local->mad_send_wr->send_buf,
2766				   &mad_send_wc, IB_MAD_SNOOP_SEND_COMPLETIONS);
2767		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2768						   &mad_send_wc);
2769
2770		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2771		atomic_dec(&mad_agent_priv->refcount);
2772		if (free_mad)
2773			kfree(local->mad_priv);
2774		kfree(local);
2775	}
2776	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2777}
2778
2779static int retry_send(struct ib_mad_send_wr_private *mad_send_wr)
2780{
2781	int ret;
2782
2783	if (!mad_send_wr->retries_left)
2784		return -ETIMEDOUT;
2785
2786	mad_send_wr->retries_left--;
2787	mad_send_wr->send_buf.retries++;
2788
2789	mad_send_wr->timeout = msecs_to_jiffies(mad_send_wr->send_buf.timeout_ms);
2790
2791	if (ib_mad_kernel_rmpp_agent(&mad_send_wr->mad_agent_priv->agent)) {
2792		ret = ib_retry_rmpp(mad_send_wr);
2793		switch (ret) {
2794		case IB_RMPP_RESULT_UNHANDLED:
2795			ret = ib_send_mad(mad_send_wr);
2796			break;
2797		case IB_RMPP_RESULT_CONSUMED:
2798			ret = 0;
2799			break;
2800		default:
2801			ret = -ECOMM;
2802			break;
2803		}
2804	} else
2805		ret = ib_send_mad(mad_send_wr);
2806
2807	if (!ret) {
2808		mad_send_wr->refcount++;
2809		list_add_tail(&mad_send_wr->agent_list,
2810			      &mad_send_wr->mad_agent_priv->send_list);
2811	}
2812	return ret;
2813}
2814
2815static void timeout_sends(struct work_struct *work)
2816{
2817	struct ib_mad_agent_private *mad_agent_priv;
2818	struct ib_mad_send_wr_private *mad_send_wr;
2819	struct ib_mad_send_wc mad_send_wc;
2820	unsigned long flags, delay;
2821
2822	mad_agent_priv = container_of(work, struct ib_mad_agent_private,
2823				      timed_work.work);
2824	mad_send_wc.vendor_err = 0;
2825
2826	spin_lock_irqsave(&mad_agent_priv->lock, flags);
2827	while (!list_empty(&mad_agent_priv->wait_list)) {
2828		mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2829					 struct ib_mad_send_wr_private,
2830					 agent_list);
2831
2832		if (time_after(mad_send_wr->timeout, jiffies)) {
2833			delay = mad_send_wr->timeout - jiffies;
2834			if ((long)delay <= 0)
2835				delay = 1;
2836			queue_delayed_work(mad_agent_priv->qp_info->
2837					   port_priv->wq,
2838					   &mad_agent_priv->timed_work, delay);
2839			break;
2840		}
2841
2842		list_del(&mad_send_wr->agent_list);
2843		if (mad_send_wr->status == IB_WC_SUCCESS &&
2844		    !retry_send(mad_send_wr))
2845			continue;
2846
2847		spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2848
2849		if (mad_send_wr->status == IB_WC_SUCCESS)
2850			mad_send_wc.status = IB_WC_RESP_TIMEOUT_ERR;
2851		else
2852			mad_send_wc.status = mad_send_wr->status;
2853		mad_send_wc.send_buf = &mad_send_wr->send_buf;
2854		mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2855						   &mad_send_wc);
2856
2857		atomic_dec(&mad_agent_priv->refcount);
2858		spin_lock_irqsave(&mad_agent_priv->lock, flags);
2859	}
2860	spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2861}
2862
 
 
 
 
 
 
 
 
 
 
 
2863/*
2864 * Allocate receive MADs and post receive WRs for them
2865 */
2866static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
2867				    struct ib_mad_private *mad)
2868{
2869	unsigned long flags;
2870	int post, ret;
2871	struct ib_mad_private *mad_priv;
2872	struct ib_sge sg_list;
2873	struct ib_recv_wr recv_wr, *bad_recv_wr;
2874	struct ib_mad_queue *recv_queue = &qp_info->recv_queue;
2875
2876	/* Initialize common scatter list fields */
2877	sg_list.lkey = qp_info->port_priv->pd->local_dma_lkey;
 
2878
2879	/* Initialize common receive WR fields */
2880	recv_wr.next = NULL;
2881	recv_wr.sg_list = &sg_list;
2882	recv_wr.num_sge = 1;
2883
2884	do {
2885		/* Allocate and map receive buffer */
2886		if (mad) {
2887			mad_priv = mad;
2888			mad = NULL;
2889		} else {
2890			mad_priv = alloc_mad_private(port_mad_size(qp_info->port_priv),
2891						     GFP_ATOMIC);
2892			if (!mad_priv) {
 
2893				ret = -ENOMEM;
2894				break;
2895			}
2896		}
2897		sg_list.length = mad_priv_dma_size(mad_priv);
2898		sg_list.addr = ib_dma_map_single(qp_info->port_priv->device,
2899						 &mad_priv->grh,
2900						 mad_priv_dma_size(mad_priv),
 
2901						 DMA_FROM_DEVICE);
2902		if (unlikely(ib_dma_mapping_error(qp_info->port_priv->device,
2903						  sg_list.addr))) {
2904			ret = -ENOMEM;
2905			break;
2906		}
2907		mad_priv->header.mapping = sg_list.addr;
 
2908		mad_priv->header.mad_list.mad_queue = recv_queue;
2909		mad_priv->header.mad_list.cqe.done = ib_mad_recv_done;
2910		recv_wr.wr_cqe = &mad_priv->header.mad_list.cqe;
2911
2912		/* Post receive WR */
2913		spin_lock_irqsave(&recv_queue->lock, flags);
2914		post = (++recv_queue->count < recv_queue->max_active);
2915		list_add_tail(&mad_priv->header.mad_list.list, &recv_queue->list);
2916		spin_unlock_irqrestore(&recv_queue->lock, flags);
2917		ret = ib_post_recv(qp_info->qp, &recv_wr, &bad_recv_wr);
2918		if (ret) {
2919			spin_lock_irqsave(&recv_queue->lock, flags);
2920			list_del(&mad_priv->header.mad_list.list);
2921			recv_queue->count--;
2922			spin_unlock_irqrestore(&recv_queue->lock, flags);
2923			ib_dma_unmap_single(qp_info->port_priv->device,
2924					    mad_priv->header.mapping,
2925					    mad_priv_dma_size(mad_priv),
 
2926					    DMA_FROM_DEVICE);
2927			kfree(mad_priv);
2928			dev_err(&qp_info->port_priv->device->dev,
2929				"ib_post_recv failed: %d\n", ret);
2930			break;
2931		}
2932	} while (post);
2933
2934	return ret;
2935}
2936
2937/*
2938 * Return all the posted receive MADs
2939 */
2940static void cleanup_recv_queue(struct ib_mad_qp_info *qp_info)
2941{
2942	struct ib_mad_private_header *mad_priv_hdr;
2943	struct ib_mad_private *recv;
2944	struct ib_mad_list_head *mad_list;
2945
2946	if (!qp_info->qp)
2947		return;
2948
2949	while (!list_empty(&qp_info->recv_queue.list)) {
2950
2951		mad_list = list_entry(qp_info->recv_queue.list.next,
2952				      struct ib_mad_list_head, list);
2953		mad_priv_hdr = container_of(mad_list,
2954					    struct ib_mad_private_header,
2955					    mad_list);
2956		recv = container_of(mad_priv_hdr, struct ib_mad_private,
2957				    header);
2958
2959		/* Remove from posted receive MAD list */
2960		list_del(&mad_list->list);
2961
2962		ib_dma_unmap_single(qp_info->port_priv->device,
2963				    recv->header.mapping,
2964				    mad_priv_dma_size(recv),
 
2965				    DMA_FROM_DEVICE);
2966		kfree(recv);
2967	}
2968
2969	qp_info->recv_queue.count = 0;
2970}
2971
2972/*
2973 * Start the port
2974 */
2975static int ib_mad_port_start(struct ib_mad_port_private *port_priv)
2976{
2977	int ret, i;
2978	struct ib_qp_attr *attr;
2979	struct ib_qp *qp;
2980	u16 pkey_index;
2981
2982	attr = kmalloc(sizeof *attr, GFP_KERNEL);
2983	if (!attr)
 
2984		return -ENOMEM;
2985
2986	ret = ib_find_pkey(port_priv->device, port_priv->port_num,
2987			   IB_DEFAULT_PKEY_FULL, &pkey_index);
2988	if (ret)
2989		pkey_index = 0;
2990
2991	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2992		qp = port_priv->qp_info[i].qp;
2993		if (!qp)
2994			continue;
2995
2996		/*
2997		 * PKey index for QP1 is irrelevant but
2998		 * one is needed for the Reset to Init transition
2999		 */
3000		attr->qp_state = IB_QPS_INIT;
3001		attr->pkey_index = pkey_index;
3002		attr->qkey = (qp->qp_num == 0) ? 0 : IB_QP1_QKEY;
3003		ret = ib_modify_qp(qp, attr, IB_QP_STATE |
3004					     IB_QP_PKEY_INDEX | IB_QP_QKEY);
3005		if (ret) {
3006			dev_err(&port_priv->device->dev,
3007				"Couldn't change QP%d state to INIT: %d\n",
3008				i, ret);
3009			goto out;
3010		}
3011
3012		attr->qp_state = IB_QPS_RTR;
3013		ret = ib_modify_qp(qp, attr, IB_QP_STATE);
3014		if (ret) {
3015			dev_err(&port_priv->device->dev,
3016				"Couldn't change QP%d state to RTR: %d\n",
3017				i, ret);
3018			goto out;
3019		}
3020
3021		attr->qp_state = IB_QPS_RTS;
3022		attr->sq_psn = IB_MAD_SEND_Q_PSN;
3023		ret = ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_SQ_PSN);
3024		if (ret) {
3025			dev_err(&port_priv->device->dev,
3026				"Couldn't change QP%d state to RTS: %d\n",
3027				i, ret);
3028			goto out;
3029		}
3030	}
3031
3032	ret = ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
3033	if (ret) {
3034		dev_err(&port_priv->device->dev,
3035			"Failed to request completion notification: %d\n",
3036			ret);
3037		goto out;
3038	}
3039
3040	for (i = 0; i < IB_MAD_QPS_CORE; i++) {
3041		if (!port_priv->qp_info[i].qp)
3042			continue;
3043
3044		ret = ib_mad_post_receive_mads(&port_priv->qp_info[i], NULL);
3045		if (ret) {
3046			dev_err(&port_priv->device->dev,
3047				"Couldn't post receive WRs\n");
3048			goto out;
3049		}
3050	}
3051out:
3052	kfree(attr);
3053	return ret;
3054}
3055
3056static void qp_event_handler(struct ib_event *event, void *qp_context)
3057{
3058	struct ib_mad_qp_info	*qp_info = qp_context;
3059
3060	/* It's worse than that! He's dead, Jim! */
3061	dev_err(&qp_info->port_priv->device->dev,
3062		"Fatal error (%d) on MAD QP (%d)\n",
3063		event->event, qp_info->qp->qp_num);
3064}
3065
3066static void init_mad_queue(struct ib_mad_qp_info *qp_info,
3067			   struct ib_mad_queue *mad_queue)
3068{
3069	mad_queue->qp_info = qp_info;
3070	mad_queue->count = 0;
3071	spin_lock_init(&mad_queue->lock);
3072	INIT_LIST_HEAD(&mad_queue->list);
3073}
3074
3075static void init_mad_qp(struct ib_mad_port_private *port_priv,
3076			struct ib_mad_qp_info *qp_info)
3077{
3078	qp_info->port_priv = port_priv;
3079	init_mad_queue(qp_info, &qp_info->send_queue);
3080	init_mad_queue(qp_info, &qp_info->recv_queue);
3081	INIT_LIST_HEAD(&qp_info->overflow_list);
3082	spin_lock_init(&qp_info->snoop_lock);
3083	qp_info->snoop_table = NULL;
3084	qp_info->snoop_table_size = 0;
3085	atomic_set(&qp_info->snoop_count, 0);
3086}
3087
3088static int create_mad_qp(struct ib_mad_qp_info *qp_info,
3089			 enum ib_qp_type qp_type)
3090{
3091	struct ib_qp_init_attr	qp_init_attr;
3092	int ret;
3093
3094	memset(&qp_init_attr, 0, sizeof qp_init_attr);
3095	qp_init_attr.send_cq = qp_info->port_priv->cq;
3096	qp_init_attr.recv_cq = qp_info->port_priv->cq;
3097	qp_init_attr.sq_sig_type = IB_SIGNAL_ALL_WR;
3098	qp_init_attr.cap.max_send_wr = mad_sendq_size;
3099	qp_init_attr.cap.max_recv_wr = mad_recvq_size;
3100	qp_init_attr.cap.max_send_sge = IB_MAD_SEND_REQ_MAX_SG;
3101	qp_init_attr.cap.max_recv_sge = IB_MAD_RECV_REQ_MAX_SG;
3102	qp_init_attr.qp_type = qp_type;
3103	qp_init_attr.port_num = qp_info->port_priv->port_num;
3104	qp_init_attr.qp_context = qp_info;
3105	qp_init_attr.event_handler = qp_event_handler;
3106	qp_info->qp = ib_create_qp(qp_info->port_priv->pd, &qp_init_attr);
3107	if (IS_ERR(qp_info->qp)) {
3108		dev_err(&qp_info->port_priv->device->dev,
3109			"Couldn't create ib_mad QP%d\n",
3110			get_spl_qp_index(qp_type));
3111		ret = PTR_ERR(qp_info->qp);
3112		goto error;
3113	}
3114	/* Use minimum queue sizes unless the CQ is resized */
3115	qp_info->send_queue.max_active = mad_sendq_size;
3116	qp_info->recv_queue.max_active = mad_recvq_size;
3117	return 0;
3118
3119error:
3120	return ret;
3121}
3122
3123static void destroy_mad_qp(struct ib_mad_qp_info *qp_info)
3124{
3125	if (!qp_info->qp)
3126		return;
3127
3128	ib_destroy_qp(qp_info->qp);
3129	kfree(qp_info->snoop_table);
3130}
3131
3132/*
3133 * Open the port
3134 * Create the QP, PD, MR, and CQ if needed
3135 */
3136static int ib_mad_port_open(struct ib_device *device,
3137			    int port_num)
3138{
3139	int ret, cq_size;
3140	struct ib_mad_port_private *port_priv;
3141	unsigned long flags;
3142	char name[sizeof "ib_mad123"];
3143	int has_smi;
3144
3145	if (WARN_ON(rdma_max_mad_size(device, port_num) < IB_MGMT_MAD_SIZE))
3146		return -EFAULT;
3147
3148	if (WARN_ON(rdma_cap_opa_mad(device, port_num) &&
3149		    rdma_max_mad_size(device, port_num) < OPA_MGMT_MAD_SIZE))
3150		return -EFAULT;
3151
3152	/* Create new device info */
3153	port_priv = kzalloc(sizeof *port_priv, GFP_KERNEL);
3154	if (!port_priv)
 
3155		return -ENOMEM;
 
3156
3157	port_priv->device = device;
3158	port_priv->port_num = port_num;
3159	spin_lock_init(&port_priv->reg_lock);
3160	INIT_LIST_HEAD(&port_priv->agent_list);
3161	init_mad_qp(port_priv, &port_priv->qp_info[0]);
3162	init_mad_qp(port_priv, &port_priv->qp_info[1]);
3163
3164	cq_size = mad_sendq_size + mad_recvq_size;
3165	has_smi = rdma_cap_ib_smi(device, port_num);
3166	if (has_smi)
3167		cq_size *= 2;
3168
3169	port_priv->cq = ib_alloc_cq(port_priv->device, port_priv, cq_size, 0,
3170			IB_POLL_WORKQUEUE);
 
3171	if (IS_ERR(port_priv->cq)) {
3172		dev_err(&device->dev, "Couldn't create ib_mad CQ\n");
3173		ret = PTR_ERR(port_priv->cq);
3174		goto error3;
3175	}
3176
3177	port_priv->pd = ib_alloc_pd(device, 0);
3178	if (IS_ERR(port_priv->pd)) {
3179		dev_err(&device->dev, "Couldn't create ib_mad PD\n");
3180		ret = PTR_ERR(port_priv->pd);
3181		goto error4;
3182	}
3183
 
 
 
 
 
 
 
3184	if (has_smi) {
3185		ret = create_mad_qp(&port_priv->qp_info[0], IB_QPT_SMI);
3186		if (ret)
3187			goto error6;
3188	}
3189	ret = create_mad_qp(&port_priv->qp_info[1], IB_QPT_GSI);
3190	if (ret)
3191		goto error7;
3192
3193	snprintf(name, sizeof name, "ib_mad%d", port_num);
3194	port_priv->wq = alloc_ordered_workqueue(name, WQ_MEM_RECLAIM);
3195	if (!port_priv->wq) {
3196		ret = -ENOMEM;
3197		goto error8;
3198	}
 
3199
3200	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
3201	list_add_tail(&port_priv->port_list, &ib_mad_port_list);
3202	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3203
3204	ret = ib_mad_port_start(port_priv);
3205	if (ret) {
3206		dev_err(&device->dev, "Couldn't start port\n");
3207		goto error9;
3208	}
3209
3210	return 0;
3211
3212error9:
3213	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
3214	list_del_init(&port_priv->port_list);
3215	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3216
3217	destroy_workqueue(port_priv->wq);
3218error8:
3219	destroy_mad_qp(&port_priv->qp_info[1]);
3220error7:
3221	destroy_mad_qp(&port_priv->qp_info[0]);
3222error6:
 
 
3223	ib_dealloc_pd(port_priv->pd);
3224error4:
3225	ib_free_cq(port_priv->cq);
3226	cleanup_recv_queue(&port_priv->qp_info[1]);
3227	cleanup_recv_queue(&port_priv->qp_info[0]);
3228error3:
3229	kfree(port_priv);
3230
3231	return ret;
3232}
3233
3234/*
3235 * Close the port
3236 * If there are no classes using the port, free the port
3237 * resources (CQ, MR, PD, QP) and remove the port's info structure
3238 */
3239static int ib_mad_port_close(struct ib_device *device, int port_num)
3240{
3241	struct ib_mad_port_private *port_priv;
3242	unsigned long flags;
3243
3244	spin_lock_irqsave(&ib_mad_port_list_lock, flags);
3245	port_priv = __ib_get_mad_port(device, port_num);
3246	if (port_priv == NULL) {
3247		spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3248		dev_err(&device->dev, "Port %d not found\n", port_num);
3249		return -ENODEV;
3250	}
3251	list_del_init(&port_priv->port_list);
3252	spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
3253
3254	destroy_workqueue(port_priv->wq);
3255	destroy_mad_qp(&port_priv->qp_info[1]);
3256	destroy_mad_qp(&port_priv->qp_info[0]);
 
3257	ib_dealloc_pd(port_priv->pd);
3258	ib_free_cq(port_priv->cq);
3259	cleanup_recv_queue(&port_priv->qp_info[1]);
3260	cleanup_recv_queue(&port_priv->qp_info[0]);
3261	/* XXX: Handle deallocation of MAD registration tables */
3262
3263	kfree(port_priv);
3264
3265	return 0;
3266}
3267
3268static void ib_mad_init_device(struct ib_device *device)
3269{
3270	int start, i;
3271
3272	start = rdma_start_port(device);
 
3273
3274	for (i = start; i <= rdma_end_port(device); i++) {
3275		if (!rdma_cap_ib_mad(device, i))
3276			continue;
 
 
 
 
3277
 
3278		if (ib_mad_port_open(device, i)) {
3279			dev_err(&device->dev, "Couldn't open port %d\n", i);
 
3280			goto error;
3281		}
3282		if (ib_agent_port_open(device, i)) {
3283			dev_err(&device->dev,
3284				"Couldn't open port %d for agents\n", i);
 
3285			goto error_agent;
3286		}
3287	}
3288	return;
3289
3290error_agent:
3291	if (ib_mad_port_close(device, i))
3292		dev_err(&device->dev, "Couldn't close port %d\n", i);
 
3293
3294error:
3295	while (--i >= start) {
3296		if (!rdma_cap_ib_mad(device, i))
3297			continue;
3298
 
3299		if (ib_agent_port_close(device, i))
3300			dev_err(&device->dev,
3301				"Couldn't close port %d for agents\n", i);
 
3302		if (ib_mad_port_close(device, i))
3303			dev_err(&device->dev, "Couldn't close port %d\n", i);
 
 
3304	}
3305}
3306
3307static void ib_mad_remove_device(struct ib_device *device, void *client_data)
3308{
3309	int i;
3310
3311	for (i = rdma_start_port(device); i <= rdma_end_port(device); i++) {
3312		if (!rdma_cap_ib_mad(device, i))
3313			continue;
3314
3315		if (ib_agent_port_close(device, i))
3316			dev_err(&device->dev,
3317				"Couldn't close port %d for agents\n", i);
3318		if (ib_mad_port_close(device, i))
3319			dev_err(&device->dev, "Couldn't close port %d\n", i);
 
 
 
 
 
 
 
 
 
 
3320	}
3321}
3322
3323static struct ib_client mad_client = {
3324	.name   = "mad",
3325	.add = ib_mad_init_device,
3326	.remove = ib_mad_remove_device
3327};
3328
3329int ib_mad_init(void)
3330{
 
 
3331	mad_recvq_size = min(mad_recvq_size, IB_MAD_QP_MAX_SIZE);
3332	mad_recvq_size = max(mad_recvq_size, IB_MAD_QP_MIN_SIZE);
3333
3334	mad_sendq_size = min(mad_sendq_size, IB_MAD_QP_MAX_SIZE);
3335	mad_sendq_size = max(mad_sendq_size, IB_MAD_QP_MIN_SIZE);
3336
 
 
 
 
 
 
 
 
 
 
 
3337	INIT_LIST_HEAD(&ib_mad_port_list);
3338
3339	if (ib_register_client(&mad_client)) {
3340		pr_err("Couldn't register ib_mad client\n");
3341		return -EINVAL;
 
3342	}
3343
3344	return 0;
 
 
 
 
 
3345}
3346
3347void ib_mad_cleanup(void)
3348{
3349	ib_unregister_client(&mad_client);
 
3350}