git.karo-electronics.de Git - karo-tx-linux.git/blob - drivers/net/ethernet/mellanox/mlx4/resource_tracker.c
net/mlx4_core: Fix potential corruption in counters database
[karo-tx-linux.git] / drivers / net / ethernet / mellanox / mlx4 / resource_tracker.c
1 /*
2  * Copyright (c) 2004, 2005 Topspin Communications.  All rights reserved.
3  * Copyright (c) 2005, 2006, 2007, 2008 Mellanox Technologies.
4  * All rights reserved.
5  * Copyright (c) 2005, 2006, 2007 Cisco Systems, Inc.  All rights reserved.
6  *
7  * This software is available to you under a choice of one of two
8  * licenses.  You may choose to be licensed under the terms of the GNU
9  * General Public License (GPL) Version 2, available from the file
10  * COPYING in the main directory of this source tree, or the
11  * OpenIB.org BSD license below:
12  *
13  *     Redistribution and use in source and binary forms, with or
14  *     without modification, are permitted provided that the following
15  *     conditions are met:
16  *
17  *      - Redistributions of source code must retain the above
18  *        copyright notice, this list of conditions and the following
19  *        disclaimer.
20  *
21  *      - Redistributions in binary form must reproduce the above
22  *        copyright notice, this list of conditions and the following
23  *        disclaimer in the documentation and/or other materials
24  *        provided with the distribution.
25  *
26  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
27  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
28  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
29  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
30  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
31  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
32  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
33  * SOFTWARE.
34  */
35
36 #include <linux/sched.h>
37 #include <linux/pci.h>
38 #include <linux/errno.h>
39 #include <linux/kernel.h>
40 #include <linux/io.h>
41 #include <linux/slab.h>
42 #include <linux/mlx4/cmd.h>
43 #include <linux/mlx4/qp.h>
44 #include <linux/if_ether.h>
45 #include <linux/etherdevice.h>
46
47 #include "mlx4.h"
48 #include "fw.h"
49 #include "mlx4_stats.h"
50
/* Bit 63 of a 64-bit word. NOTE(review): presumably marks a MAC entry as valid - confirm at the use sites. */
#define MLX4_MAC_VALID          (1ull << 63)
/* Counters guaranteed to the master function (PF), per port, by the resource tracker */
#define MLX4_PF_COUNTERS_PER_PORT       2
/* Counters guaranteed, per port, to each VF that receives a guarantee */
#define MLX4_VF_COUNTERS_PER_PORT       1
54
/*
 * Bookkeeping record for one MAC address.
 * NOTE(review): the code that creates and walks these records is outside
 * this view; presumably they are linked into a per-slave list - confirm.
 */
struct mac_res {
        struct list_head list;  /* list linkage */
        u64 mac;                /* the MAC address value */
        int ref_count;          /* reference count for this record */
        u8 smac_index;
        u8 port;
};
62
/*
 * Bookkeeping record for one VLAN id.
 * NOTE(review): the code that creates and walks these records is outside
 * this view; presumably they are linked into a per-slave list - confirm.
 */
struct vlan_res {
        struct list_head list;  /* list linkage */
        u16 vlan;               /* the VLAN id */
        int ref_count;          /* reference count for this record */
        int vlan_index;
        u8 port;
};
70
/*
 * Header shared by the tracked-resource structures below, each of which
 * embeds it as its first member ("com").
 */
struct res_common {
        struct list_head        list;           /* list linkage */
        /* rb-tree linkage; res_tracker_lookup()/res_tracker_insert() order the tree by res_id */
        struct rb_node          node;
        u64                     res_id;         /* key of this resource in the rb-tree */
        int                     owner;
        int                     state;
        /* NOTE(review): from_state/to_state presumably describe an in-flight state change - confirm */
        int                     from_state;
        int                     to_state;
        int                     removing;
};
81
/* Shared "busy" state value: every per-type RES_*_BUSY enumerator below is defined equal to it. */
enum {
        RES_ANY_BUSY = 1
};
85
/*
 * Record describing one GID together with its protocol and steering type.
 * NOTE(review): presumably an element of a QP's mcg_list - confirm.
 */
struct res_gid {
        struct list_head        list;           /* list linkage */
        u8                      gid[16];        /* 16-byte GID */
        enum mlx4_protocol      prot;
        enum mlx4_steer_type    steer;
        u64                     reg_id;
};
93
/* Tracker states of a QP; RES_QP_BUSY shares its value with RES_ANY_BUSY. */
enum res_qp_states {
        RES_QP_BUSY = RES_ANY_BUSY,

        /* QP number was allocated */
        RES_QP_RESERVED,

        /* ICM memory for QP context was mapped */
        RES_QP_MAPPED,

        /* QP is in hw ownership */
        RES_QP_HW
};
106
/*
 * Tracker entry for a QP.  Starts with the common header and carries
 * pointers to tracker entries of other resource types (MTT, CQs, SRQ).
 * NOTE(review): presumably those are the resources the QP is bound to -
 * confirm against the code that fills them in.
 */
struct res_qp {
        struct res_common       com;            /* common tracker header */
        struct res_mtt         *mtt;
        struct res_cq          *rcq;
        struct res_cq          *scq;
        struct res_srq         *srq;
        struct list_head        mcg_list;
        spinlock_t              mcg_spl;        /* NOTE(review): presumably guards mcg_list - confirm */
        int                     local_qpn;
        atomic_t                ref_count;
        u32                     qpc_flags;
        /* saved qp params before VST enforcement in order to restore on VGT */
        u8                      sched_queue;
        __be32                  param3;
        u8                      vlan_control;
        u8                      fvl_rx;
        u8                      pri_path_fl;
        u8                      vlan_index;
        u8                      feup;
};
127
/* Tracker states of an MTT range; RES_MTT_BUSY shares its value with RES_ANY_BUSY. */
enum res_mtt_states {
        RES_MTT_BUSY = RES_ANY_BUSY,
        RES_MTT_ALLOCATED,
};
132
133 static inline const char *mtt_states_str(enum res_mtt_states state)
134 {
135         switch (state) {
136         case RES_MTT_BUSY: return "RES_MTT_BUSY";
137         case RES_MTT_ALLOCATED: return "RES_MTT_ALLOCATED";
138         default: return "Unknown";
139         }
140 }
141
/* Tracker entry for an MTT range. */
struct res_mtt {
        struct res_common       com;            /* common tracker header */
        int                     order;          /* NOTE(review): presumably log2 of the range size - confirm */
        atomic_t                ref_count;
};
147
/* Tracker states of an MPT entry; RES_MPT_BUSY shares its value with RES_ANY_BUSY. */
enum res_mpt_states {
        RES_MPT_BUSY = RES_ANY_BUSY,
        RES_MPT_RESERVED,
        RES_MPT_MAPPED,
        RES_MPT_HW,
};
154
/* Tracker entry for an MPT; points at an MTT tracker entry. */
struct res_mpt {
        struct res_common       com;            /* common tracker header */
        struct res_mtt         *mtt;
        int                     key;
};
160
/* Tracker states of an EQ; RES_EQ_BUSY shares its value with RES_ANY_BUSY. */
enum res_eq_states {
        RES_EQ_BUSY = RES_ANY_BUSY,
        RES_EQ_RESERVED,
        RES_EQ_HW,
};
166
/* Tracker entry for an EQ; points at an MTT tracker entry. */
struct res_eq {
        struct res_common       com;            /* common tracker header */
        struct res_mtt         *mtt;
};
171
/* Tracker states of a CQ; RES_CQ_BUSY shares its value with RES_ANY_BUSY. */
enum res_cq_states {
        RES_CQ_BUSY = RES_ANY_BUSY,
        RES_CQ_ALLOCATED,
        RES_CQ_HW,
};
177
/* Tracker entry for a CQ; points at an MTT tracker entry and is reference counted. */
struct res_cq {
        struct res_common       com;            /* common tracker header */
        struct res_mtt         *mtt;
        atomic_t                ref_count;
};
183
/* Tracker states of an SRQ; RES_SRQ_BUSY shares its value with RES_ANY_BUSY. */
enum res_srq_states {
        RES_SRQ_BUSY = RES_ANY_BUSY,
        RES_SRQ_ALLOCATED,
        RES_SRQ_HW,
};
189
/* Tracker entry for an SRQ; points at MTT and CQ tracker entries and is reference counted. */
struct res_srq {
        struct res_common       com;            /* common tracker header */
        struct res_mtt         *mtt;
        struct res_cq          *cq;
        atomic_t                ref_count;
};
196
/* Tracker states of a counter; RES_COUNTER_BUSY shares its value with RES_ANY_BUSY. */
enum res_counter_states {
        RES_COUNTER_BUSY = RES_ANY_BUSY,
        RES_COUNTER_ALLOCATED,
};
201
/* Tracker entry for a counter, tagged with a port number. */
struct res_counter {
        struct res_common       com;            /* common tracker header */
        int                     port;
};
206
/* Tracker states of an XRC domain; RES_XRCD_BUSY shares its value with RES_ANY_BUSY. */
enum res_xrcdn_states {
        RES_XRCD_BUSY = RES_ANY_BUSY,
        RES_XRCD_ALLOCATED,
};
211
/* Tracker entry for an XRC domain number. */
struct res_xrcdn {
        struct res_common       com;            /* common tracker header */
        int                     port;
};
216
/* Tracker states of a flow-steering rule; RES_FS_RULE_BUSY shares its value with RES_ANY_BUSY. */
enum res_fs_rule_states {
        RES_FS_RULE_BUSY = RES_ANY_BUSY,
        RES_FS_RULE_ALLOCATED,
};
221
/*
 * Tracker entry for a flow-steering rule, including the data kept for a
 * mirrored copy of the rule (see the field comments).
 */
struct res_fs_rule {
        struct res_common       com;            /* common tracker header */
        int                     qpn;            /* NOTE(review): presumably the QP the rule steers to - confirm */
        /* VF DMFS mbox with port flipped */
        void                    *mirr_mbox;
        /* > 0 --> apply mirror when getting into HA mode      */
        /* = 0 --> un-apply mirror when getting out of HA mode */
        u32                     mirr_mbox_size;
        struct list_head        mirr_list;
        u64                     mirr_rule_id;
};
233
234 static void *res_tracker_lookup(struct rb_root *root, u64 res_id)
235 {
236         struct rb_node *node = root->rb_node;
237
238         while (node) {
239                 struct res_common *res = container_of(node, struct res_common,
240                                                       node);
241
242                 if (res_id < res->res_id)
243                         node = node->rb_left;
244                 else if (res_id > res->res_id)
245                         node = node->rb_right;
246                 else
247                         return res;
248         }
249         return NULL;
250 }
251
252 static int res_tracker_insert(struct rb_root *root, struct res_common *res)
253 {
254         struct rb_node **new = &(root->rb_node), *parent = NULL;
255
256         /* Figure out where to put new node */
257         while (*new) {
258                 struct res_common *this = container_of(*new, struct res_common,
259                                                        node);
260
261                 parent = *new;
262                 if (res->res_id < this->res_id)
263                         new = &((*new)->rb_left);
264                 else if (res->res_id > this->res_id)
265                         new = &((*new)->rb_right);
266                 else
267                         return -EEXIST;
268         }
269
270         /* Add new node and rebalance tree. */
271         rb_link_node(&res->node, parent, new);
272         rb_insert_color(&res->node, root);
273
274         return 0;
275 }
276
/*
 * Identifiers for QP state transitions, named <from>2<to>.
 * NOTE(review): the consumers of these values are outside this view.
 */
enum qp_transition {
        QP_TRANS_INIT2RTR,
        QP_TRANS_RTR2RTS,
        QP_TRANS_RTS2RTS,
        QP_TRANS_SQERR2RTS,
        QP_TRANS_SQD2SQD,
        QP_TRANS_SQD2RTS
};
285
286 /* For Debug uses */
287 static const char *resource_str(enum mlx4_resource rt)
288 {
289         switch (rt) {
290         case RES_QP: return "RES_QP";
291         case RES_CQ: return "RES_CQ";
292         case RES_SRQ: return "RES_SRQ";
293         case RES_MPT: return "RES_MPT";
294         case RES_MTT: return "RES_MTT";
295         case RES_MAC: return  "RES_MAC";
296         case RES_VLAN: return  "RES_VLAN";
297         case RES_EQ: return "RES_EQ";
298         case RES_COUNTER: return "RES_COUNTER";
299         case RES_FS_RULE: return "RES_FS_RULE";
300         case RES_XRCD: return "RES_XRCD";
301         default: return "Unknown resource type !!!";
302         };
303 }
304
/* Forward declaration; mlx4_free_resource_tracker() below calls it. */
static void rem_slave_vlans(struct mlx4_dev *dev, int slave);
306 static inline int mlx4_grant_resource(struct mlx4_dev *dev, int slave,
307                                       enum mlx4_resource res_type, int count,
308                                       int port)
309 {
310         struct mlx4_priv *priv = mlx4_priv(dev);
311         struct resource_allocator *res_alloc =
312                 &priv->mfunc.master.res_tracker.res_alloc[res_type];
313         int err = -EINVAL;
314         int allocated, free, reserved, guaranteed, from_free;
315         int from_rsvd;
316
317         if (slave > dev->persist->num_vfs)
318                 return -EINVAL;
319
320         spin_lock(&res_alloc->alloc_lock);
321         allocated = (port > 0) ?
322                 res_alloc->allocated[(port - 1) *
323                 (dev->persist->num_vfs + 1) + slave] :
324                 res_alloc->allocated[slave];
325         free = (port > 0) ? res_alloc->res_port_free[port - 1] :
326                 res_alloc->res_free;
327         reserved = (port > 0) ? res_alloc->res_port_rsvd[port - 1] :
328                 res_alloc->res_reserved;
329         guaranteed = res_alloc->guaranteed[slave];
330
331         if (allocated + count > res_alloc->quota[slave]) {
332                 mlx4_warn(dev, "VF %d port %d res %s: quota exceeded, count %d alloc %d quota %d\n",
333                           slave, port, resource_str(res_type), count,
334                           allocated, res_alloc->quota[slave]);
335                 goto out;
336         }
337
338         if (allocated + count <= guaranteed) {
339                 err = 0;
340                 from_rsvd = count;
341         } else {
342                 /* portion may need to be obtained from free area */
343                 if (guaranteed - allocated > 0)
344                         from_free = count - (guaranteed - allocated);
345                 else
346                         from_free = count;
347
348                 from_rsvd = count - from_free;
349
350                 if (free - from_free >= reserved)
351                         err = 0;
352                 else
353                         mlx4_warn(dev, "VF %d port %d res %s: free pool empty, free %d from_free %d rsvd %d\n",
354                                   slave, port, resource_str(res_type), free,
355                                   from_free, reserved);
356         }
357
358         if (!err) {
359                 /* grant the request */
360                 if (port > 0) {
361                         res_alloc->allocated[(port - 1) *
362                         (dev->persist->num_vfs + 1) + slave] += count;
363                         res_alloc->res_port_free[port - 1] -= count;
364                         res_alloc->res_port_rsvd[port - 1] -= from_rsvd;
365                 } else {
366                         res_alloc->allocated[slave] += count;
367                         res_alloc->res_free -= count;
368                         res_alloc->res_reserved -= from_rsvd;
369                 }
370         }
371
372 out:
373         spin_unlock(&res_alloc->alloc_lock);
374         return err;
375 }
376
377 static inline void mlx4_release_resource(struct mlx4_dev *dev, int slave,
378                                     enum mlx4_resource res_type, int count,
379                                     int port)
380 {
381         struct mlx4_priv *priv = mlx4_priv(dev);
382         struct resource_allocator *res_alloc =
383                 &priv->mfunc.master.res_tracker.res_alloc[res_type];
384         int allocated, guaranteed, from_rsvd;
385
386         if (slave > dev->persist->num_vfs)
387                 return;
388
389         spin_lock(&res_alloc->alloc_lock);
390
391         allocated = (port > 0) ?
392                 res_alloc->allocated[(port - 1) *
393                 (dev->persist->num_vfs + 1) + slave] :
394                 res_alloc->allocated[slave];
395         guaranteed = res_alloc->guaranteed[slave];
396
397         if (allocated - count >= guaranteed) {
398                 from_rsvd = 0;
399         } else {
400                 /* portion may need to be returned to reserved area */
401                 if (allocated - guaranteed > 0)
402                         from_rsvd = count - (allocated - guaranteed);
403                 else
404                         from_rsvd = count;
405         }
406
407         if (port > 0) {
408                 res_alloc->allocated[(port - 1) *
409                 (dev->persist->num_vfs + 1) + slave] -= count;
410                 res_alloc->res_port_free[port - 1] += count;
411                 res_alloc->res_port_rsvd[port - 1] += from_rsvd;
412         } else {
413                 res_alloc->allocated[slave] -= count;
414                 res_alloc->res_free += count;
415                 res_alloc->res_reserved += from_rsvd;
416         }
417
418         spin_unlock(&res_alloc->alloc_lock);
419         return;
420 }
421
422 static inline void initialize_res_quotas(struct mlx4_dev *dev,
423                                          struct resource_allocator *res_alloc,
424                                          enum mlx4_resource res_type,
425                                          int vf, int num_instances)
426 {
427         res_alloc->guaranteed[vf] = num_instances /
428                                     (2 * (dev->persist->num_vfs + 1));
429         res_alloc->quota[vf] = (num_instances / 2) + res_alloc->guaranteed[vf];
430         if (vf == mlx4_master_func_num(dev)) {
431                 res_alloc->res_free = num_instances;
432                 if (res_type == RES_MTT) {
433                         /* reserved mtts will be taken out of the PF allocation */
434                         res_alloc->res_free += dev->caps.reserved_mtts;
435                         res_alloc->guaranteed[vf] += dev->caps.reserved_mtts;
436                         res_alloc->quota[vf] += dev->caps.reserved_mtts;
437                 }
438         }
439 }
440
441 void mlx4_init_quotas(struct mlx4_dev *dev)
442 {
443         struct mlx4_priv *priv = mlx4_priv(dev);
444         int pf;
445
446         /* quotas for VFs are initialized in mlx4_slave_cap */
447         if (mlx4_is_slave(dev))
448                 return;
449
450         if (!mlx4_is_mfunc(dev)) {
451                 dev->quotas.qp = dev->caps.num_qps - dev->caps.reserved_qps -
452                         mlx4_num_reserved_sqps(dev);
453                 dev->quotas.cq = dev->caps.num_cqs - dev->caps.reserved_cqs;
454                 dev->quotas.srq = dev->caps.num_srqs - dev->caps.reserved_srqs;
455                 dev->quotas.mtt = dev->caps.num_mtts - dev->caps.reserved_mtts;
456                 dev->quotas.mpt = dev->caps.num_mpts - dev->caps.reserved_mrws;
457                 return;
458         }
459
460         pf = mlx4_master_func_num(dev);
461         dev->quotas.qp =
462                 priv->mfunc.master.res_tracker.res_alloc[RES_QP].quota[pf];
463         dev->quotas.cq =
464                 priv->mfunc.master.res_tracker.res_alloc[RES_CQ].quota[pf];
465         dev->quotas.srq =
466                 priv->mfunc.master.res_tracker.res_alloc[RES_SRQ].quota[pf];
467         dev->quotas.mtt =
468                 priv->mfunc.master.res_tracker.res_alloc[RES_MTT].quota[pf];
469         dev->quotas.mpt =
470                 priv->mfunc.master.res_tracker.res_alloc[RES_MPT].quota[pf];
471 }
472
473 static int get_max_gauranteed_vfs_counter(struct mlx4_dev *dev)
474 {
475         /* reduce the sink counter */
476         return (dev->caps.max_counters - 1 -
477                 (MLX4_PF_COUNTERS_PER_PORT * MLX4_MAX_PORTS))
478                 / MLX4_MAX_PORTS;
479 }
480
481 int mlx4_init_resource_tracker(struct mlx4_dev *dev)
482 {
483         struct mlx4_priv *priv = mlx4_priv(dev);
484         int i, j;
485         int t;
486         int max_vfs_guarantee_counter = get_max_gauranteed_vfs_counter(dev);
487
488         priv->mfunc.master.res_tracker.slave_list =
489                 kzalloc(dev->num_slaves * sizeof(struct slave_list),
490                         GFP_KERNEL);
491         if (!priv->mfunc.master.res_tracker.slave_list)
492                 return -ENOMEM;
493
494         for (i = 0 ; i < dev->num_slaves; i++) {
495                 for (t = 0; t < MLX4_NUM_OF_RESOURCE_TYPE; ++t)
496                         INIT_LIST_HEAD(&priv->mfunc.master.res_tracker.
497                                        slave_list[i].res_list[t]);
498                 mutex_init(&priv->mfunc.master.res_tracker.slave_list[i].mutex);
499         }
500
501         mlx4_dbg(dev, "Started init_resource_tracker: %ld slaves\n",
502                  dev->num_slaves);
503         for (i = 0 ; i < MLX4_NUM_OF_RESOURCE_TYPE; i++)
504                 priv->mfunc.master.res_tracker.res_tree[i] = RB_ROOT;
505
506         for (i = 0; i < MLX4_NUM_OF_RESOURCE_TYPE; i++) {
507                 struct resource_allocator *res_alloc =
508                         &priv->mfunc.master.res_tracker.res_alloc[i];
509                 res_alloc->quota = kmalloc((dev->persist->num_vfs + 1) *
510                                            sizeof(int), GFP_KERNEL);
511                 res_alloc->guaranteed = kmalloc((dev->persist->num_vfs + 1) *
512                                                 sizeof(int), GFP_KERNEL);
513                 if (i == RES_MAC || i == RES_VLAN)
514                         res_alloc->allocated = kzalloc(MLX4_MAX_PORTS *
515                                                        (dev->persist->num_vfs
516                                                        + 1) *
517                                                        sizeof(int), GFP_KERNEL);
518                 else
519                         res_alloc->allocated = kzalloc((dev->persist->
520                                                         num_vfs + 1) *
521                                                        sizeof(int), GFP_KERNEL);
522                 /* Reduce the sink counter */
523                 if (i == RES_COUNTER)
524                         res_alloc->res_free = dev->caps.max_counters - 1;
525
526                 if (!res_alloc->quota || !res_alloc->guaranteed ||
527                     !res_alloc->allocated)
528                         goto no_mem_err;
529
530                 spin_lock_init(&res_alloc->alloc_lock);
531                 for (t = 0; t < dev->persist->num_vfs + 1; t++) {
532                         struct mlx4_active_ports actv_ports =
533                                 mlx4_get_active_ports(dev, t);
534                         switch (i) {
535                         case RES_QP:
536                                 initialize_res_quotas(dev, res_alloc, RES_QP,
537                                                       t, dev->caps.num_qps -
538                                                       dev->caps.reserved_qps -
539                                                       mlx4_num_reserved_sqps(dev));
540                                 break;
541                         case RES_CQ:
542                                 initialize_res_quotas(dev, res_alloc, RES_CQ,
543                                                       t, dev->caps.num_cqs -
544                                                       dev->caps.reserved_cqs);
545                                 break;
546                         case RES_SRQ:
547                                 initialize_res_quotas(dev, res_alloc, RES_SRQ,
548                                                       t, dev->caps.num_srqs -
549                                                       dev->caps.reserved_srqs);
550                                 break;
551                         case RES_MPT:
552                                 initialize_res_quotas(dev, res_alloc, RES_MPT,
553                                                       t, dev->caps.num_mpts -
554                                                       dev->caps.reserved_mrws);
555                                 break;
556                         case RES_MTT:
557                                 initialize_res_quotas(dev, res_alloc, RES_MTT,
558                                                       t, dev->caps.num_mtts -
559                                                       dev->caps.reserved_mtts);
560                                 break;
561                         case RES_MAC:
562                                 if (t == mlx4_master_func_num(dev)) {
563                                         int max_vfs_pport = 0;
564                                         /* Calculate the max vfs per port for */
565                                         /* both ports.                        */
566                                         for (j = 0; j < dev->caps.num_ports;
567                                              j++) {
568                                                 struct mlx4_slaves_pport slaves_pport =
569                                                         mlx4_phys_to_slaves_pport(dev, j + 1);
570                                                 unsigned current_slaves =
571                                                         bitmap_weight(slaves_pport.slaves,
572                                                                       dev->caps.num_ports) - 1;
573                                                 if (max_vfs_pport < current_slaves)
574                                                         max_vfs_pport =
575                                                                 current_slaves;
576                                         }
577                                         res_alloc->quota[t] =
578                                                 MLX4_MAX_MAC_NUM -
579                                                 2 * max_vfs_pport;
580                                         res_alloc->guaranteed[t] = 2;
581                                         for (j = 0; j < MLX4_MAX_PORTS; j++)
582                                                 res_alloc->res_port_free[j] =
583                                                         MLX4_MAX_MAC_NUM;
584                                 } else {
585                                         res_alloc->quota[t] = MLX4_MAX_MAC_NUM;
586                                         res_alloc->guaranteed[t] = 2;
587                                 }
588                                 break;
589                         case RES_VLAN:
590                                 if (t == mlx4_master_func_num(dev)) {
591                                         res_alloc->quota[t] = MLX4_MAX_VLAN_NUM;
592                                         res_alloc->guaranteed[t] = MLX4_MAX_VLAN_NUM / 2;
593                                         for (j = 0; j < MLX4_MAX_PORTS; j++)
594                                                 res_alloc->res_port_free[j] =
595                                                         res_alloc->quota[t];
596                                 } else {
597                                         res_alloc->quota[t] = MLX4_MAX_VLAN_NUM / 2;
598                                         res_alloc->guaranteed[t] = 0;
599                                 }
600                                 break;
601                         case RES_COUNTER:
602                                 res_alloc->quota[t] = dev->caps.max_counters;
603                                 if (t == mlx4_master_func_num(dev))
604                                         res_alloc->guaranteed[t] =
605                                                 MLX4_PF_COUNTERS_PER_PORT *
606                                                 MLX4_MAX_PORTS;
607                                 else if (t <= max_vfs_guarantee_counter)
608                                         res_alloc->guaranteed[t] =
609                                                 MLX4_VF_COUNTERS_PER_PORT *
610                                                 MLX4_MAX_PORTS;
611                                 else
612                                         res_alloc->guaranteed[t] = 0;
613                                 res_alloc->res_free -= res_alloc->guaranteed[t];
614                                 break;
615                         default:
616                                 break;
617                         }
618                         if (i == RES_MAC || i == RES_VLAN) {
619                                 for (j = 0; j < dev->caps.num_ports; j++)
620                                         if (test_bit(j, actv_ports.ports))
621                                                 res_alloc->res_port_rsvd[j] +=
622                                                         res_alloc->guaranteed[t];
623                         } else {
624                                 res_alloc->res_reserved += res_alloc->guaranteed[t];
625                         }
626                 }
627         }
628         spin_lock_init(&priv->mfunc.master.res_tracker.lock);
629         return 0;
630
631 no_mem_err:
632         for (i = 0; i < MLX4_NUM_OF_RESOURCE_TYPE; i++) {
633                 kfree(priv->mfunc.master.res_tracker.res_alloc[i].allocated);
634                 priv->mfunc.master.res_tracker.res_alloc[i].allocated = NULL;
635                 kfree(priv->mfunc.master.res_tracker.res_alloc[i].guaranteed);
636                 priv->mfunc.master.res_tracker.res_alloc[i].guaranteed = NULL;
637                 kfree(priv->mfunc.master.res_tracker.res_alloc[i].quota);
638                 priv->mfunc.master.res_tracker.res_alloc[i].quota = NULL;
639         }
640         return -ENOMEM;
641 }
642
643 void mlx4_free_resource_tracker(struct mlx4_dev *dev,
644                                 enum mlx4_res_tracker_free_type type)
645 {
646         struct mlx4_priv *priv = mlx4_priv(dev);
647         int i;
648
649         if (priv->mfunc.master.res_tracker.slave_list) {
650                 if (type != RES_TR_FREE_STRUCTS_ONLY) {
651                         for (i = 0; i < dev->num_slaves; i++) {
652                                 if (type == RES_TR_FREE_ALL ||
653                                     dev->caps.function != i)
654                                         mlx4_delete_all_resources_for_slave(dev, i);
655                         }
656                         /* free master's vlans */
657                         i = dev->caps.function;
658                         mlx4_reset_roce_gids(dev, i);
659                         mutex_lock(&priv->mfunc.master.res_tracker.slave_list[i].mutex);
660                         rem_slave_vlans(dev, i);
661                         mutex_unlock(&priv->mfunc.master.res_tracker.slave_list[i].mutex);
662                 }
663
664                 if (type != RES_TR_FREE_SLAVES_ONLY) {
665                         for (i = 0; i < MLX4_NUM_OF_RESOURCE_TYPE; i++) {
666                                 kfree(priv->mfunc.master.res_tracker.res_alloc[i].allocated);
667                                 priv->mfunc.master.res_tracker.res_alloc[i].allocated = NULL;
668                                 kfree(priv->mfunc.master.res_tracker.res_alloc[i].guaranteed);
669                                 priv->mfunc.master.res_tracker.res_alloc[i].guaranteed = NULL;
670                                 kfree(priv->mfunc.master.res_tracker.res_alloc[i].quota);
671                                 priv->mfunc.master.res_tracker.res_alloc[i].quota = NULL;
672                         }
673                         kfree(priv->mfunc.master.res_tracker.slave_list);
674                         priv->mfunc.master.res_tracker.slave_list = NULL;
675                 }
676         }
677 }
678
679 static void update_pkey_index(struct mlx4_dev *dev, int slave,
680                               struct mlx4_cmd_mailbox *inbox)
681 {
682         u8 sched = *(u8 *)(inbox->buf + 64);
683         u8 orig_index = *(u8 *)(inbox->buf + 35);
684         u8 new_index;
685         struct mlx4_priv *priv = mlx4_priv(dev);
686         int port;
687
688         port = (sched >> 6 & 1) + 1;
689
690         new_index = priv->virt2phys_pkey[slave][port - 1][orig_index];
691         *(u8 *)(inbox->buf + 35) = new_index;
692 }
693
694 static void update_gid(struct mlx4_dev *dev, struct mlx4_cmd_mailbox *inbox,
695                        u8 slave)
696 {
697         struct mlx4_qp_context  *qp_ctx = inbox->buf + 8;
698         enum mlx4_qp_optpar     optpar = be32_to_cpu(*(__be32 *) inbox->buf);
699         u32                     ts = (be32_to_cpu(qp_ctx->flags) >> 16) & 0xff;
700         int port;
701
702         if (MLX4_QP_ST_UD == ts) {
703                 port = (qp_ctx->pri_path.sched_queue >> 6 & 1) + 1;
704                 if (mlx4_is_eth(dev, port))
705                         qp_ctx->pri_path.mgid_index =
706                                 mlx4_get_base_gid_ix(dev, slave, port) | 0x80;
707                 else
708                         qp_ctx->pri_path.mgid_index = slave | 0x80;
709
710         } else if (MLX4_QP_ST_RC == ts || MLX4_QP_ST_XRC == ts || MLX4_QP_ST_UC == ts) {
711                 if (optpar & MLX4_QP_OPTPAR_PRIMARY_ADDR_PATH) {
712                         port = (qp_ctx->pri_path.sched_queue >> 6 & 1) + 1;
713                         if (mlx4_is_eth(dev, port)) {
714                                 qp_ctx->pri_path.mgid_index +=
715                                         mlx4_get_base_gid_ix(dev, slave, port);
716                                 qp_ctx->pri_path.mgid_index &= 0x7f;
717                         } else {
718                                 qp_ctx->pri_path.mgid_index = slave & 0x7F;
719                         }
720                 }
721                 if (optpar & MLX4_QP_OPTPAR_ALT_ADDR_PATH) {
722                         port = (qp_ctx->alt_path.sched_queue >> 6 & 1) + 1;
723                         if (mlx4_is_eth(dev, port)) {
724                                 qp_ctx->alt_path.mgid_index +=
725                                         mlx4_get_base_gid_ix(dev, slave, port);
726                                 qp_ctx->alt_path.mgid_index &= 0x7f;
727                         } else {
728                                 qp_ctx->alt_path.mgid_index = slave & 0x7F;
729                         }
730                 }
731         }
732 }
733
734 static int handle_counter(struct mlx4_dev *dev, struct mlx4_qp_context *qpc,
735                           u8 slave, int port);
736
737 static int update_vport_qp_param(struct mlx4_dev *dev,
738                                  struct mlx4_cmd_mailbox *inbox,
739                                  u8 slave, u32 qpn)
740 {
741         struct mlx4_qp_context  *qpc = inbox->buf + 8;
742         struct mlx4_vport_oper_state *vp_oper;
743         struct mlx4_priv *priv;
744         u32 qp_type;
745         int port, err = 0;
746
747         port = (qpc->pri_path.sched_queue & 0x40) ? 2 : 1;
748         priv = mlx4_priv(dev);
749         vp_oper = &priv->mfunc.master.vf_oper[slave].vport[port];
750         qp_type = (be32_to_cpu(qpc->flags) >> 16) & 0xff;
751
752         err = handle_counter(dev, qpc, slave, port);
753         if (err)
754                 goto out;
755
756         if (MLX4_VGT != vp_oper->state.default_vlan) {
757                 /* the reserved QPs (special, proxy, tunnel)
758                  * do not operate over vlans
759                  */
760                 if (mlx4_is_qp_reserved(dev, qpn))
761                         return 0;
762
763                 /* force strip vlan by clear vsd, MLX QP refers to Raw Ethernet */
764                 if (qp_type == MLX4_QP_ST_UD ||
765                     (qp_type == MLX4_QP_ST_MLX && mlx4_is_eth(dev, port))) {
766                         if (dev->caps.bmme_flags & MLX4_BMME_FLAG_VSD_INIT2RTR) {
767                                 *(__be32 *)inbox->buf =
768                                         cpu_to_be32(be32_to_cpu(*(__be32 *)inbox->buf) |
769                                         MLX4_QP_OPTPAR_VLAN_STRIPPING);
770                                 qpc->param3 &= ~cpu_to_be32(MLX4_STRIP_VLAN);
771                         } else {
772                                 struct mlx4_update_qp_params params = {.flags = 0};
773
774                                 err = mlx4_update_qp(dev, qpn, MLX4_UPDATE_QP_VSD, &params);
775                                 if (err)
776                                         goto out;
777                         }
778                 }
779
780                 /* preserve IF_COUNTER flag */
781                 qpc->pri_path.vlan_control &=
782                         MLX4_CTRL_ETH_SRC_CHECK_IF_COUNTER;
783                 if (vp_oper->state.link_state == IFLA_VF_LINK_STATE_DISABLE &&
784                     dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_UPDATE_QP) {
785                         qpc->pri_path.vlan_control |=
786                                 MLX4_VLAN_CTRL_ETH_TX_BLOCK_TAGGED |
787                                 MLX4_VLAN_CTRL_ETH_TX_BLOCK_PRIO_TAGGED |
788                                 MLX4_VLAN_CTRL_ETH_TX_BLOCK_UNTAGGED |
789                                 MLX4_VLAN_CTRL_ETH_RX_BLOCK_PRIO_TAGGED |
790                                 MLX4_VLAN_CTRL_ETH_RX_BLOCK_UNTAGGED |
791                                 MLX4_VLAN_CTRL_ETH_RX_BLOCK_TAGGED;
792                 } else if (0 != vp_oper->state.default_vlan) {
793                         qpc->pri_path.vlan_control |=
794                                 MLX4_VLAN_CTRL_ETH_TX_BLOCK_TAGGED |
795                                 MLX4_VLAN_CTRL_ETH_RX_BLOCK_PRIO_TAGGED |
796                                 MLX4_VLAN_CTRL_ETH_RX_BLOCK_UNTAGGED;
797                 } else { /* priority tagged */
798                         qpc->pri_path.vlan_control |=
799                                 MLX4_VLAN_CTRL_ETH_TX_BLOCK_TAGGED |
800                                 MLX4_VLAN_CTRL_ETH_RX_BLOCK_TAGGED;
801                 }
802
803                 qpc->pri_path.fvl_rx |= MLX4_FVL_RX_FORCE_ETH_VLAN;
804                 qpc->pri_path.vlan_index = vp_oper->vlan_idx;
805                 qpc->pri_path.fl |= MLX4_FL_CV | MLX4_FL_ETH_HIDE_CQE_VLAN;
806                 qpc->pri_path.feup |= MLX4_FEUP_FORCE_ETH_UP | MLX4_FVL_FORCE_ETH_VLAN;
807                 qpc->pri_path.sched_queue &= 0xC7;
808                 qpc->pri_path.sched_queue |= (vp_oper->state.default_qos) << 3;
809                 qpc->qos_vport = vp_oper->state.qos_vport;
810         }
811         if (vp_oper->state.spoofchk) {
812                 qpc->pri_path.feup |= MLX4_FSM_FORCE_ETH_SRC_MAC;
813                 qpc->pri_path.grh_mylmc = (0x80 & qpc->pri_path.grh_mylmc) + vp_oper->mac_idx;
814         }
815 out:
816         return err;
817 }
818
819 static int mpt_mask(struct mlx4_dev *dev)
820 {
821         return dev->caps.num_mpts - 1;
822 }
823
824 static void *find_res(struct mlx4_dev *dev, u64 res_id,
825                       enum mlx4_resource type)
826 {
827         struct mlx4_priv *priv = mlx4_priv(dev);
828
829         return res_tracker_lookup(&priv->mfunc.master.res_tracker.res_tree[type],
830                                   res_id);
831 }
832
833 static int get_res(struct mlx4_dev *dev, int slave, u64 res_id,
834                    enum mlx4_resource type,
835                    void *res)
836 {
837         struct res_common *r;
838         int err = 0;
839
840         spin_lock_irq(mlx4_tlock(dev));
841         r = find_res(dev, res_id, type);
842         if (!r) {
843                 err = -ENONET;
844                 goto exit;
845         }
846
847         if (r->state == RES_ANY_BUSY) {
848                 err = -EBUSY;
849                 goto exit;
850         }
851
852         if (r->owner != slave) {
853                 err = -EPERM;
854                 goto exit;
855         }
856
857         r->from_state = r->state;
858         r->state = RES_ANY_BUSY;
859
860         if (res)
861                 *((struct res_common **)res) = r;
862
863 exit:
864         spin_unlock_irq(mlx4_tlock(dev));
865         return err;
866 }
867
868 int mlx4_get_slave_from_resource_id(struct mlx4_dev *dev,
869                                     enum mlx4_resource type,
870                                     u64 res_id, int *slave)
871 {
872
873         struct res_common *r;
874         int err = -ENOENT;
875         int id = res_id;
876
877         if (type == RES_QP)
878                 id &= 0x7fffff;
879         spin_lock(mlx4_tlock(dev));
880
881         r = find_res(dev, id, type);
882         if (r) {
883                 *slave = r->owner;
884                 err = 0;
885         }
886         spin_unlock(mlx4_tlock(dev));
887
888         return err;
889 }
890
891 static void put_res(struct mlx4_dev *dev, int slave, u64 res_id,
892                     enum mlx4_resource type)
893 {
894         struct res_common *r;
895
896         spin_lock_irq(mlx4_tlock(dev));
897         r = find_res(dev, res_id, type);
898         if (r)
899                 r->state = r->from_state;
900         spin_unlock_irq(mlx4_tlock(dev));
901 }
902
903 static int counter_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
904                              u64 in_param, u64 *out_param, int port);
905
906 static int handle_existing_counter(struct mlx4_dev *dev, u8 slave, int port,
907                                    int counter_index)
908 {
909         struct res_common *r;
910         struct res_counter *counter;
911         int ret = 0;
912
913         if (counter_index == MLX4_SINK_COUNTER_INDEX(dev))
914                 return ret;
915
916         spin_lock_irq(mlx4_tlock(dev));
917         r = find_res(dev, counter_index, RES_COUNTER);
918         if (!r || r->owner != slave) {
919                 ret = -EINVAL;
920         } else {
921                 counter = container_of(r, struct res_counter, com);
922                 if (!counter->port)
923                         counter->port = port;
924         }
925
926         spin_unlock_irq(mlx4_tlock(dev));
927         return ret;
928 }
929
930 static int handle_unexisting_counter(struct mlx4_dev *dev,
931                                      struct mlx4_qp_context *qpc, u8 slave,
932                                      int port)
933 {
934         struct mlx4_priv *priv = mlx4_priv(dev);
935         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
936         struct res_common *tmp;
937         struct res_counter *counter;
938         u64 counter_idx = MLX4_SINK_COUNTER_INDEX(dev);
939         int err = 0;
940
941         spin_lock_irq(mlx4_tlock(dev));
942         list_for_each_entry(tmp,
943                             &tracker->slave_list[slave].res_list[RES_COUNTER],
944                             list) {
945                 counter = container_of(tmp, struct res_counter, com);
946                 if (port == counter->port) {
947                         qpc->pri_path.counter_index  = counter->com.res_id;
948                         spin_unlock_irq(mlx4_tlock(dev));
949                         return 0;
950                 }
951         }
952         spin_unlock_irq(mlx4_tlock(dev));
953
954         /* No existing counter, need to allocate a new counter */
955         err = counter_alloc_res(dev, slave, RES_OP_RESERVE, 0, 0, &counter_idx,
956                                 port);
957         if (err == -ENOENT) {
958                 err = 0;
959         } else if (err && err != -ENOSPC) {
960                 mlx4_err(dev, "%s: failed to create new counter for slave %d err %d\n",
961                          __func__, slave, err);
962         } else {
963                 qpc->pri_path.counter_index = counter_idx;
964                 mlx4_dbg(dev, "%s: alloc new counter for slave %d index %d\n",
965                          __func__, slave, qpc->pri_path.counter_index);
966                 err = 0;
967         }
968
969         return err;
970 }
971
972 static int handle_counter(struct mlx4_dev *dev, struct mlx4_qp_context *qpc,
973                           u8 slave, int port)
974 {
975         if (qpc->pri_path.counter_index != MLX4_SINK_COUNTER_INDEX(dev))
976                 return handle_existing_counter(dev, slave, port,
977                                                qpc->pri_path.counter_index);
978
979         return handle_unexisting_counter(dev, qpc, slave, port);
980 }
981
982 static struct res_common *alloc_qp_tr(int id)
983 {
984         struct res_qp *ret;
985
986         ret = kzalloc(sizeof *ret, GFP_KERNEL);
987         if (!ret)
988                 return NULL;
989
990         ret->com.res_id = id;
991         ret->com.state = RES_QP_RESERVED;
992         ret->local_qpn = id;
993         INIT_LIST_HEAD(&ret->mcg_list);
994         spin_lock_init(&ret->mcg_spl);
995         atomic_set(&ret->ref_count, 0);
996
997         return &ret->com;
998 }
999
1000 static struct res_common *alloc_mtt_tr(int id, int order)
1001 {
1002         struct res_mtt *ret;
1003
1004         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1005         if (!ret)
1006                 return NULL;
1007
1008         ret->com.res_id = id;
1009         ret->order = order;
1010         ret->com.state = RES_MTT_ALLOCATED;
1011         atomic_set(&ret->ref_count, 0);
1012
1013         return &ret->com;
1014 }
1015
1016 static struct res_common *alloc_mpt_tr(int id, int key)
1017 {
1018         struct res_mpt *ret;
1019
1020         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1021         if (!ret)
1022                 return NULL;
1023
1024         ret->com.res_id = id;
1025         ret->com.state = RES_MPT_RESERVED;
1026         ret->key = key;
1027
1028         return &ret->com;
1029 }
1030
1031 static struct res_common *alloc_eq_tr(int id)
1032 {
1033         struct res_eq *ret;
1034
1035         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1036         if (!ret)
1037                 return NULL;
1038
1039         ret->com.res_id = id;
1040         ret->com.state = RES_EQ_RESERVED;
1041
1042         return &ret->com;
1043 }
1044
1045 static struct res_common *alloc_cq_tr(int id)
1046 {
1047         struct res_cq *ret;
1048
1049         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1050         if (!ret)
1051                 return NULL;
1052
1053         ret->com.res_id = id;
1054         ret->com.state = RES_CQ_ALLOCATED;
1055         atomic_set(&ret->ref_count, 0);
1056
1057         return &ret->com;
1058 }
1059
1060 static struct res_common *alloc_srq_tr(int id)
1061 {
1062         struct res_srq *ret;
1063
1064         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1065         if (!ret)
1066                 return NULL;
1067
1068         ret->com.res_id = id;
1069         ret->com.state = RES_SRQ_ALLOCATED;
1070         atomic_set(&ret->ref_count, 0);
1071
1072         return &ret->com;
1073 }
1074
1075 static struct res_common *alloc_counter_tr(int id, int port)
1076 {
1077         struct res_counter *ret;
1078
1079         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1080         if (!ret)
1081                 return NULL;
1082
1083         ret->com.res_id = id;
1084         ret->com.state = RES_COUNTER_ALLOCATED;
1085         ret->port = port;
1086
1087         return &ret->com;
1088 }
1089
1090 static struct res_common *alloc_xrcdn_tr(int id)
1091 {
1092         struct res_xrcdn *ret;
1093
1094         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1095         if (!ret)
1096                 return NULL;
1097
1098         ret->com.res_id = id;
1099         ret->com.state = RES_XRCD_ALLOCATED;
1100
1101         return &ret->com;
1102 }
1103
1104 static struct res_common *alloc_fs_rule_tr(u64 id, int qpn)
1105 {
1106         struct res_fs_rule *ret;
1107
1108         ret = kzalloc(sizeof *ret, GFP_KERNEL);
1109         if (!ret)
1110                 return NULL;
1111
1112         ret->com.res_id = id;
1113         ret->com.state = RES_FS_RULE_ALLOCATED;
1114         ret->qpn = qpn;
1115         return &ret->com;
1116 }
1117
1118 static struct res_common *alloc_tr(u64 id, enum mlx4_resource type, int slave,
1119                                    int extra)
1120 {
1121         struct res_common *ret;
1122
1123         switch (type) {
1124         case RES_QP:
1125                 ret = alloc_qp_tr(id);
1126                 break;
1127         case RES_MPT:
1128                 ret = alloc_mpt_tr(id, extra);
1129                 break;
1130         case RES_MTT:
1131                 ret = alloc_mtt_tr(id, extra);
1132                 break;
1133         case RES_EQ:
1134                 ret = alloc_eq_tr(id);
1135                 break;
1136         case RES_CQ:
1137                 ret = alloc_cq_tr(id);
1138                 break;
1139         case RES_SRQ:
1140                 ret = alloc_srq_tr(id);
1141                 break;
1142         case RES_MAC:
1143                 pr_err("implementation missing\n");
1144                 return NULL;
1145         case RES_COUNTER:
1146                 ret = alloc_counter_tr(id, extra);
1147                 break;
1148         case RES_XRCD:
1149                 ret = alloc_xrcdn_tr(id);
1150                 break;
1151         case RES_FS_RULE:
1152                 ret = alloc_fs_rule_tr(id, extra);
1153                 break;
1154         default:
1155                 return NULL;
1156         }
1157         if (ret)
1158                 ret->owner = slave;
1159
1160         return ret;
1161 }
1162
1163 int mlx4_calc_vf_counters(struct mlx4_dev *dev, int slave, int port,
1164                           struct mlx4_counter *data)
1165 {
1166         struct mlx4_priv *priv = mlx4_priv(dev);
1167         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1168         struct res_common *tmp;
1169         struct res_counter *counter;
1170         int *counters_arr;
1171         int i = 0, err = 0;
1172
1173         memset(data, 0, sizeof(*data));
1174
1175         counters_arr = kmalloc_array(dev->caps.max_counters,
1176                                      sizeof(*counters_arr), GFP_KERNEL);
1177         if (!counters_arr)
1178                 return -ENOMEM;
1179
1180         spin_lock_irq(mlx4_tlock(dev));
1181         list_for_each_entry(tmp,
1182                             &tracker->slave_list[slave].res_list[RES_COUNTER],
1183                             list) {
1184                 counter = container_of(tmp, struct res_counter, com);
1185                 if (counter->port == port) {
1186                         counters_arr[i] = (int)tmp->res_id;
1187                         i++;
1188                 }
1189         }
1190         spin_unlock_irq(mlx4_tlock(dev));
1191         counters_arr[i] = -1;
1192
1193         i = 0;
1194
1195         while (counters_arr[i] != -1) {
1196                 err = mlx4_get_counter_stats(dev, counters_arr[i], data,
1197                                              0);
1198                 if (err) {
1199                         memset(data, 0, sizeof(*data));
1200                         goto table_changed;
1201                 }
1202                 i++;
1203         }
1204
1205 table_changed:
1206         kfree(counters_arr);
1207         return 0;
1208 }
1209
1210 static int add_res_range(struct mlx4_dev *dev, int slave, u64 base, int count,
1211                          enum mlx4_resource type, int extra)
1212 {
1213         int i;
1214         int err;
1215         struct mlx4_priv *priv = mlx4_priv(dev);
1216         struct res_common **res_arr;
1217         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1218         struct rb_root *root = &tracker->res_tree[type];
1219
1220         res_arr = kzalloc(count * sizeof *res_arr, GFP_KERNEL);
1221         if (!res_arr)
1222                 return -ENOMEM;
1223
1224         for (i = 0; i < count; ++i) {
1225                 res_arr[i] = alloc_tr(base + i, type, slave, extra);
1226                 if (!res_arr[i]) {
1227                         for (--i; i >= 0; --i)
1228                                 kfree(res_arr[i]);
1229
1230                         kfree(res_arr);
1231                         return -ENOMEM;
1232                 }
1233         }
1234
1235         spin_lock_irq(mlx4_tlock(dev));
1236         for (i = 0; i < count; ++i) {
1237                 if (find_res(dev, base + i, type)) {
1238                         err = -EEXIST;
1239                         goto undo;
1240                 }
1241                 err = res_tracker_insert(root, res_arr[i]);
1242                 if (err)
1243                         goto undo;
1244                 list_add_tail(&res_arr[i]->list,
1245                               &tracker->slave_list[slave].res_list[type]);
1246         }
1247         spin_unlock_irq(mlx4_tlock(dev));
1248         kfree(res_arr);
1249
1250         return 0;
1251
1252 undo:
1253         for (--i; i >= 0; --i) {
1254                 rb_erase(&res_arr[i]->node, root);
1255                 list_del_init(&res_arr[i]->list);
1256         }
1257
1258         spin_unlock_irq(mlx4_tlock(dev));
1259
1260         for (i = 0; i < count; ++i)
1261                 kfree(res_arr[i]);
1262
1263         kfree(res_arr);
1264
1265         return err;
1266 }
1267
1268 static int remove_qp_ok(struct res_qp *res)
1269 {
1270         if (res->com.state == RES_QP_BUSY || atomic_read(&res->ref_count) ||
1271             !list_empty(&res->mcg_list)) {
1272                 pr_err("resource tracker: fail to remove qp, state %d, ref_count %d\n",
1273                        res->com.state, atomic_read(&res->ref_count));
1274                 return -EBUSY;
1275         } else if (res->com.state != RES_QP_RESERVED) {
1276                 return -EPERM;
1277         }
1278
1279         return 0;
1280 }
1281
1282 static int remove_mtt_ok(struct res_mtt *res, int order)
1283 {
1284         if (res->com.state == RES_MTT_BUSY ||
1285             atomic_read(&res->ref_count)) {
1286                 pr_devel("%s-%d: state %s, ref_count %d\n",
1287                          __func__, __LINE__,
1288                          mtt_states_str(res->com.state),
1289                          atomic_read(&res->ref_count));
1290                 return -EBUSY;
1291         } else if (res->com.state != RES_MTT_ALLOCATED)
1292                 return -EPERM;
1293         else if (res->order != order)
1294                 return -EINVAL;
1295
1296         return 0;
1297 }
1298
1299 static int remove_mpt_ok(struct res_mpt *res)
1300 {
1301         if (res->com.state == RES_MPT_BUSY)
1302                 return -EBUSY;
1303         else if (res->com.state != RES_MPT_RESERVED)
1304                 return -EPERM;
1305
1306         return 0;
1307 }
1308
1309 static int remove_eq_ok(struct res_eq *res)
1310 {
1311         if (res->com.state == RES_MPT_BUSY)
1312                 return -EBUSY;
1313         else if (res->com.state != RES_MPT_RESERVED)
1314                 return -EPERM;
1315
1316         return 0;
1317 }
1318
1319 static int remove_counter_ok(struct res_counter *res)
1320 {
1321         if (res->com.state == RES_COUNTER_BUSY)
1322                 return -EBUSY;
1323         else if (res->com.state != RES_COUNTER_ALLOCATED)
1324                 return -EPERM;
1325
1326         return 0;
1327 }
1328
1329 static int remove_xrcdn_ok(struct res_xrcdn *res)
1330 {
1331         if (res->com.state == RES_XRCD_BUSY)
1332                 return -EBUSY;
1333         else if (res->com.state != RES_XRCD_ALLOCATED)
1334                 return -EPERM;
1335
1336         return 0;
1337 }
1338
1339 static int remove_fs_rule_ok(struct res_fs_rule *res)
1340 {
1341         if (res->com.state == RES_FS_RULE_BUSY)
1342                 return -EBUSY;
1343         else if (res->com.state != RES_FS_RULE_ALLOCATED)
1344                 return -EPERM;
1345
1346         return 0;
1347 }
1348
1349 static int remove_cq_ok(struct res_cq *res)
1350 {
1351         if (res->com.state == RES_CQ_BUSY)
1352                 return -EBUSY;
1353         else if (res->com.state != RES_CQ_ALLOCATED)
1354                 return -EPERM;
1355
1356         return 0;
1357 }
1358
1359 static int remove_srq_ok(struct res_srq *res)
1360 {
1361         if (res->com.state == RES_SRQ_BUSY)
1362                 return -EBUSY;
1363         else if (res->com.state != RES_SRQ_ALLOCATED)
1364                 return -EPERM;
1365
1366         return 0;
1367 }
1368
1369 static int remove_ok(struct res_common *res, enum mlx4_resource type, int extra)
1370 {
1371         switch (type) {
1372         case RES_QP:
1373                 return remove_qp_ok((struct res_qp *)res);
1374         case RES_CQ:
1375                 return remove_cq_ok((struct res_cq *)res);
1376         case RES_SRQ:
1377                 return remove_srq_ok((struct res_srq *)res);
1378         case RES_MPT:
1379                 return remove_mpt_ok((struct res_mpt *)res);
1380         case RES_MTT:
1381                 return remove_mtt_ok((struct res_mtt *)res, extra);
1382         case RES_MAC:
1383                 return -ENOSYS;
1384         case RES_EQ:
1385                 return remove_eq_ok((struct res_eq *)res);
1386         case RES_COUNTER:
1387                 return remove_counter_ok((struct res_counter *)res);
1388         case RES_XRCD:
1389                 return remove_xrcdn_ok((struct res_xrcdn *)res);
1390         case RES_FS_RULE:
1391                 return remove_fs_rule_ok((struct res_fs_rule *)res);
1392         default:
1393                 return -EINVAL;
1394         }
1395 }
1396
1397 static int rem_res_range(struct mlx4_dev *dev, int slave, u64 base, int count,
1398                          enum mlx4_resource type, int extra)
1399 {
1400         u64 i;
1401         int err;
1402         struct mlx4_priv *priv = mlx4_priv(dev);
1403         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1404         struct res_common *r;
1405
1406         spin_lock_irq(mlx4_tlock(dev));
1407         for (i = base; i < base + count; ++i) {
1408                 r = res_tracker_lookup(&tracker->res_tree[type], i);
1409                 if (!r) {
1410                         err = -ENOENT;
1411                         goto out;
1412                 }
1413                 if (r->owner != slave) {
1414                         err = -EPERM;
1415                         goto out;
1416                 }
1417                 err = remove_ok(r, type, extra);
1418                 if (err)
1419                         goto out;
1420         }
1421
1422         for (i = base; i < base + count; ++i) {
1423                 r = res_tracker_lookup(&tracker->res_tree[type], i);
1424                 rb_erase(&r->node, &tracker->res_tree[type]);
1425                 list_del(&r->list);
1426                 kfree(r);
1427         }
1428         err = 0;
1429
1430 out:
1431         spin_unlock_irq(mlx4_tlock(dev));
1432
1433         return err;
1434 }
1435
1436 static int qp_res_start_move_to(struct mlx4_dev *dev, int slave, int qpn,
1437                                 enum res_qp_states state, struct res_qp **qp,
1438                                 int alloc)
1439 {
1440         struct mlx4_priv *priv = mlx4_priv(dev);
1441         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1442         struct res_qp *r;
1443         int err = 0;
1444
1445         spin_lock_irq(mlx4_tlock(dev));
1446         r = res_tracker_lookup(&tracker->res_tree[RES_QP], qpn);
1447         if (!r)
1448                 err = -ENOENT;
1449         else if (r->com.owner != slave)
1450                 err = -EPERM;
1451         else {
1452                 switch (state) {
1453                 case RES_QP_BUSY:
1454                         mlx4_dbg(dev, "%s: failed RES_QP, 0x%llx\n",
1455                                  __func__, r->com.res_id);
1456                         err = -EBUSY;
1457                         break;
1458
1459                 case RES_QP_RESERVED:
1460                         if (r->com.state == RES_QP_MAPPED && !alloc)
1461                                 break;
1462
1463                         mlx4_dbg(dev, "failed RES_QP, 0x%llx\n", r->com.res_id);
1464                         err = -EINVAL;
1465                         break;
1466
1467                 case RES_QP_MAPPED:
1468                         if ((r->com.state == RES_QP_RESERVED && alloc) ||
1469                             r->com.state == RES_QP_HW)
1470                                 break;
1471                         else {
1472                                 mlx4_dbg(dev, "failed RES_QP, 0x%llx\n",
1473                                           r->com.res_id);
1474                                 err = -EINVAL;
1475                         }
1476
1477                         break;
1478
1479                 case RES_QP_HW:
1480                         if (r->com.state != RES_QP_MAPPED)
1481                                 err = -EINVAL;
1482                         break;
1483                 default:
1484                         err = -EINVAL;
1485                 }
1486
1487                 if (!err) {
1488                         r->com.from_state = r->com.state;
1489                         r->com.to_state = state;
1490                         r->com.state = RES_QP_BUSY;
1491                         if (qp)
1492                                 *qp = r;
1493                 }
1494         }
1495
1496         spin_unlock_irq(mlx4_tlock(dev));
1497
1498         return err;
1499 }
1500
1501 static int mr_res_start_move_to(struct mlx4_dev *dev, int slave, int index,
1502                                 enum res_mpt_states state, struct res_mpt **mpt)
1503 {
1504         struct mlx4_priv *priv = mlx4_priv(dev);
1505         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1506         struct res_mpt *r;
1507         int err = 0;
1508
1509         spin_lock_irq(mlx4_tlock(dev));
1510         r = res_tracker_lookup(&tracker->res_tree[RES_MPT], index);
1511         if (!r)
1512                 err = -ENOENT;
1513         else if (r->com.owner != slave)
1514                 err = -EPERM;
1515         else {
1516                 switch (state) {
1517                 case RES_MPT_BUSY:
1518                         err = -EINVAL;
1519                         break;
1520
1521                 case RES_MPT_RESERVED:
1522                         if (r->com.state != RES_MPT_MAPPED)
1523                                 err = -EINVAL;
1524                         break;
1525
1526                 case RES_MPT_MAPPED:
1527                         if (r->com.state != RES_MPT_RESERVED &&
1528                             r->com.state != RES_MPT_HW)
1529                                 err = -EINVAL;
1530                         break;
1531
1532                 case RES_MPT_HW:
1533                         if (r->com.state != RES_MPT_MAPPED)
1534                                 err = -EINVAL;
1535                         break;
1536                 default:
1537                         err = -EINVAL;
1538                 }
1539
1540                 if (!err) {
1541                         r->com.from_state = r->com.state;
1542                         r->com.to_state = state;
1543                         r->com.state = RES_MPT_BUSY;
1544                         if (mpt)
1545                                 *mpt = r;
1546                 }
1547         }
1548
1549         spin_unlock_irq(mlx4_tlock(dev));
1550
1551         return err;
1552 }
1553
1554 static int eq_res_start_move_to(struct mlx4_dev *dev, int slave, int index,
1555                                 enum res_eq_states state, struct res_eq **eq)
1556 {
1557         struct mlx4_priv *priv = mlx4_priv(dev);
1558         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1559         struct res_eq *r;
1560         int err = 0;
1561
1562         spin_lock_irq(mlx4_tlock(dev));
1563         r = res_tracker_lookup(&tracker->res_tree[RES_EQ], index);
1564         if (!r)
1565                 err = -ENOENT;
1566         else if (r->com.owner != slave)
1567                 err = -EPERM;
1568         else {
1569                 switch (state) {
1570                 case RES_EQ_BUSY:
1571                         err = -EINVAL;
1572                         break;
1573
1574                 case RES_EQ_RESERVED:
1575                         if (r->com.state != RES_EQ_HW)
1576                                 err = -EINVAL;
1577                         break;
1578
1579                 case RES_EQ_HW:
1580                         if (r->com.state != RES_EQ_RESERVED)
1581                                 err = -EINVAL;
1582                         break;
1583
1584                 default:
1585                         err = -EINVAL;
1586                 }
1587
1588                 if (!err) {
1589                         r->com.from_state = r->com.state;
1590                         r->com.to_state = state;
1591                         r->com.state = RES_EQ_BUSY;
1592                         if (eq)
1593                                 *eq = r;
1594                 }
1595         }
1596
1597         spin_unlock_irq(mlx4_tlock(dev));
1598
1599         return err;
1600 }
1601
1602 static int cq_res_start_move_to(struct mlx4_dev *dev, int slave, int cqn,
1603                                 enum res_cq_states state, struct res_cq **cq)
1604 {
1605         struct mlx4_priv *priv = mlx4_priv(dev);
1606         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1607         struct res_cq *r;
1608         int err;
1609
1610         spin_lock_irq(mlx4_tlock(dev));
1611         r = res_tracker_lookup(&tracker->res_tree[RES_CQ], cqn);
1612         if (!r) {
1613                 err = -ENOENT;
1614         } else if (r->com.owner != slave) {
1615                 err = -EPERM;
1616         } else if (state == RES_CQ_ALLOCATED) {
1617                 if (r->com.state != RES_CQ_HW)
1618                         err = -EINVAL;
1619                 else if (atomic_read(&r->ref_count))
1620                         err = -EBUSY;
1621                 else
1622                         err = 0;
1623         } else if (state != RES_CQ_HW || r->com.state != RES_CQ_ALLOCATED) {
1624                 err = -EINVAL;
1625         } else {
1626                 err = 0;
1627         }
1628
1629         if (!err) {
1630                 r->com.from_state = r->com.state;
1631                 r->com.to_state = state;
1632                 r->com.state = RES_CQ_BUSY;
1633                 if (cq)
1634                         *cq = r;
1635         }
1636
1637         spin_unlock_irq(mlx4_tlock(dev));
1638
1639         return err;
1640 }
1641
1642 static int srq_res_start_move_to(struct mlx4_dev *dev, int slave, int index,
1643                                  enum res_srq_states state, struct res_srq **srq)
1644 {
1645         struct mlx4_priv *priv = mlx4_priv(dev);
1646         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1647         struct res_srq *r;
1648         int err = 0;
1649
1650         spin_lock_irq(mlx4_tlock(dev));
1651         r = res_tracker_lookup(&tracker->res_tree[RES_SRQ], index);
1652         if (!r) {
1653                 err = -ENOENT;
1654         } else if (r->com.owner != slave) {
1655                 err = -EPERM;
1656         } else if (state == RES_SRQ_ALLOCATED) {
1657                 if (r->com.state != RES_SRQ_HW)
1658                         err = -EINVAL;
1659                 else if (atomic_read(&r->ref_count))
1660                         err = -EBUSY;
1661         } else if (state != RES_SRQ_HW || r->com.state != RES_SRQ_ALLOCATED) {
1662                 err = -EINVAL;
1663         }
1664
1665         if (!err) {
1666                 r->com.from_state = r->com.state;
1667                 r->com.to_state = state;
1668                 r->com.state = RES_SRQ_BUSY;
1669                 if (srq)
1670                         *srq = r;
1671         }
1672
1673         spin_unlock_irq(mlx4_tlock(dev));
1674
1675         return err;
1676 }
1677
1678 static void res_abort_move(struct mlx4_dev *dev, int slave,
1679                            enum mlx4_resource type, int id)
1680 {
1681         struct mlx4_priv *priv = mlx4_priv(dev);
1682         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1683         struct res_common *r;
1684
1685         spin_lock_irq(mlx4_tlock(dev));
1686         r = res_tracker_lookup(&tracker->res_tree[type], id);
1687         if (r && (r->owner == slave))
1688                 r->state = r->from_state;
1689         spin_unlock_irq(mlx4_tlock(dev));
1690 }
1691
1692 static void res_end_move(struct mlx4_dev *dev, int slave,
1693                          enum mlx4_resource type, int id)
1694 {
1695         struct mlx4_priv *priv = mlx4_priv(dev);
1696         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1697         struct res_common *r;
1698
1699         spin_lock_irq(mlx4_tlock(dev));
1700         r = res_tracker_lookup(&tracker->res_tree[type], id);
1701         if (r && (r->owner == slave))
1702                 r->state = r->to_state;
1703         spin_unlock_irq(mlx4_tlock(dev));
1704 }
1705
/*
 * Non-zero when @qpn is a reserved QP (per mlx4_is_qp_reserved()) and either
 * the device is the master or mlx4_is_guest_proxy() accepts (@slave, @qpn).
 */
static int valid_reserved(struct mlx4_dev *dev, int slave, int qpn)
{
	if (!mlx4_is_qp_reserved(dev, qpn))
		return 0;

	return mlx4_is_master(dev) || mlx4_is_guest_proxy(dev, slave, qpn);
}
1711
1712 static int fw_reserved(struct mlx4_dev *dev, int qpn)
1713 {
1714         return qpn < dev->caps.reserved_qps_cnt[MLX4_QP_REGION_FW];
1715 }
1716
1717 static int qp_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
1718                         u64 in_param, u64 *out_param)
1719 {
1720         int err;
1721         int count;
1722         int align;
1723         int base;
1724         int qpn;
1725         u8 flags;
1726
1727         switch (op) {
1728         case RES_OP_RESERVE:
1729                 count = get_param_l(&in_param) & 0xffffff;
1730                 /* Turn off all unsupported QP allocation flags that the
1731                  * slave tries to set.
1732                  */
1733                 flags = (get_param_l(&in_param) >> 24) & dev->caps.alloc_res_qp_mask;
1734                 align = get_param_h(&in_param);
1735                 err = mlx4_grant_resource(dev, slave, RES_QP, count, 0);
1736                 if (err)
1737                         return err;
1738
1739                 err = __mlx4_qp_reserve_range(dev, count, align, &base, flags);
1740                 if (err) {
1741                         mlx4_release_resource(dev, slave, RES_QP, count, 0);
1742                         return err;
1743                 }
1744
1745                 err = add_res_range(dev, slave, base, count, RES_QP, 0);
1746                 if (err) {
1747                         mlx4_release_resource(dev, slave, RES_QP, count, 0);
1748                         __mlx4_qp_release_range(dev, base, count);
1749                         return err;
1750                 }
1751                 set_param_l(out_param, base);
1752                 break;
1753         case RES_OP_MAP_ICM:
1754                 qpn = get_param_l(&in_param) & 0x7fffff;
1755                 if (valid_reserved(dev, slave, qpn)) {
1756                         err = add_res_range(dev, slave, qpn, 1, RES_QP, 0);
1757                         if (err)
1758                                 return err;
1759                 }
1760
1761                 err = qp_res_start_move_to(dev, slave, qpn, RES_QP_MAPPED,
1762                                            NULL, 1);
1763                 if (err)
1764                         return err;
1765
1766                 if (!fw_reserved(dev, qpn)) {
1767                         err = __mlx4_qp_alloc_icm(dev, qpn, GFP_KERNEL);
1768                         if (err) {
1769                                 res_abort_move(dev, slave, RES_QP, qpn);
1770                                 return err;
1771                         }
1772                 }
1773
1774                 res_end_move(dev, slave, RES_QP, qpn);
1775                 break;
1776
1777         default:
1778                 err = -EINVAL;
1779                 break;
1780         }
1781         return err;
1782 }
1783
1784 static int mtt_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
1785                          u64 in_param, u64 *out_param)
1786 {
1787         int err = -EINVAL;
1788         int base;
1789         int order;
1790
1791         if (op != RES_OP_RESERVE_AND_MAP)
1792                 return err;
1793
1794         order = get_param_l(&in_param);
1795
1796         err = mlx4_grant_resource(dev, slave, RES_MTT, 1 << order, 0);
1797         if (err)
1798                 return err;
1799
1800         base = __mlx4_alloc_mtt_range(dev, order);
1801         if (base == -1) {
1802                 mlx4_release_resource(dev, slave, RES_MTT, 1 << order, 0);
1803                 return -ENOMEM;
1804         }
1805
1806         err = add_res_range(dev, slave, base, 1, RES_MTT, order);
1807         if (err) {
1808                 mlx4_release_resource(dev, slave, RES_MTT, 1 << order, 0);
1809                 __mlx4_free_mtt_range(dev, base, order);
1810         } else {
1811                 set_param_l(out_param, base);
1812         }
1813
1814         return err;
1815 }
1816
1817 static int mpt_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
1818                          u64 in_param, u64 *out_param)
1819 {
1820         int err = -EINVAL;
1821         int index;
1822         int id;
1823         struct res_mpt *mpt;
1824
1825         switch (op) {
1826         case RES_OP_RESERVE:
1827                 err = mlx4_grant_resource(dev, slave, RES_MPT, 1, 0);
1828                 if (err)
1829                         break;
1830
1831                 index = __mlx4_mpt_reserve(dev);
1832                 if (index == -1) {
1833                         mlx4_release_resource(dev, slave, RES_MPT, 1, 0);
1834                         break;
1835                 }
1836                 id = index & mpt_mask(dev);
1837
1838                 err = add_res_range(dev, slave, id, 1, RES_MPT, index);
1839                 if (err) {
1840                         mlx4_release_resource(dev, slave, RES_MPT, 1, 0);
1841                         __mlx4_mpt_release(dev, index);
1842                         break;
1843                 }
1844                 set_param_l(out_param, index);
1845                 break;
1846         case RES_OP_MAP_ICM:
1847                 index = get_param_l(&in_param);
1848                 id = index & mpt_mask(dev);
1849                 err = mr_res_start_move_to(dev, slave, id,
1850                                            RES_MPT_MAPPED, &mpt);
1851                 if (err)
1852                         return err;
1853
1854                 err = __mlx4_mpt_alloc_icm(dev, mpt->key, GFP_KERNEL);
1855                 if (err) {
1856                         res_abort_move(dev, slave, RES_MPT, id);
1857                         return err;
1858                 }
1859
1860                 res_end_move(dev, slave, RES_MPT, id);
1861                 break;
1862         }
1863         return err;
1864 }
1865
1866 static int cq_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
1867                         u64 in_param, u64 *out_param)
1868 {
1869         int cqn;
1870         int err;
1871
1872         switch (op) {
1873         case RES_OP_RESERVE_AND_MAP:
1874                 err = mlx4_grant_resource(dev, slave, RES_CQ, 1, 0);
1875                 if (err)
1876                         break;
1877
1878                 err = __mlx4_cq_alloc_icm(dev, &cqn);
1879                 if (err) {
1880                         mlx4_release_resource(dev, slave, RES_CQ, 1, 0);
1881                         break;
1882                 }
1883
1884                 err = add_res_range(dev, slave, cqn, 1, RES_CQ, 0);
1885                 if (err) {
1886                         mlx4_release_resource(dev, slave, RES_CQ, 1, 0);
1887                         __mlx4_cq_free_icm(dev, cqn);
1888                         break;
1889                 }
1890
1891                 set_param_l(out_param, cqn);
1892                 break;
1893
1894         default:
1895                 err = -EINVAL;
1896         }
1897
1898         return err;
1899 }
1900
1901 static int srq_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
1902                          u64 in_param, u64 *out_param)
1903 {
1904         int srqn;
1905         int err;
1906
1907         switch (op) {
1908         case RES_OP_RESERVE_AND_MAP:
1909                 err = mlx4_grant_resource(dev, slave, RES_SRQ, 1, 0);
1910                 if (err)
1911                         break;
1912
1913                 err = __mlx4_srq_alloc_icm(dev, &srqn);
1914                 if (err) {
1915                         mlx4_release_resource(dev, slave, RES_SRQ, 1, 0);
1916                         break;
1917                 }
1918
1919                 err = add_res_range(dev, slave, srqn, 1, RES_SRQ, 0);
1920                 if (err) {
1921                         mlx4_release_resource(dev, slave, RES_SRQ, 1, 0);
1922                         __mlx4_srq_free_icm(dev, srqn);
1923                         break;
1924                 }
1925
1926                 set_param_l(out_param, srqn);
1927                 break;
1928
1929         default:
1930                 err = -EINVAL;
1931         }
1932
1933         return err;
1934 }
1935
1936 static int mac_find_smac_ix_in_slave(struct mlx4_dev *dev, int slave, int port,
1937                                      u8 smac_index, u64 *mac)
1938 {
1939         struct mlx4_priv *priv = mlx4_priv(dev);
1940         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1941         struct list_head *mac_list =
1942                 &tracker->slave_list[slave].res_list[RES_MAC];
1943         struct mac_res *res, *tmp;
1944
1945         list_for_each_entry_safe(res, tmp, mac_list, list) {
1946                 if (res->smac_index == smac_index && res->port == (u8) port) {
1947                         *mac = res->mac;
1948                         return 0;
1949                 }
1950         }
1951         return -ENOENT;
1952 }
1953
1954 static int mac_add_to_slave(struct mlx4_dev *dev, int slave, u64 mac, int port, u8 smac_index)
1955 {
1956         struct mlx4_priv *priv = mlx4_priv(dev);
1957         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1958         struct list_head *mac_list =
1959                 &tracker->slave_list[slave].res_list[RES_MAC];
1960         struct mac_res *res, *tmp;
1961
1962         list_for_each_entry_safe(res, tmp, mac_list, list) {
1963                 if (res->mac == mac && res->port == (u8) port) {
1964                         /* mac found. update ref count */
1965                         ++res->ref_count;
1966                         return 0;
1967                 }
1968         }
1969
1970         if (mlx4_grant_resource(dev, slave, RES_MAC, 1, port))
1971                 return -EINVAL;
1972         res = kzalloc(sizeof *res, GFP_KERNEL);
1973         if (!res) {
1974                 mlx4_release_resource(dev, slave, RES_MAC, 1, port);
1975                 return -ENOMEM;
1976         }
1977         res->mac = mac;
1978         res->port = (u8) port;
1979         res->smac_index = smac_index;
1980         res->ref_count = 1;
1981         list_add_tail(&res->list,
1982                       &tracker->slave_list[slave].res_list[RES_MAC]);
1983         return 0;
1984 }
1985
1986 static void mac_del_from_slave(struct mlx4_dev *dev, int slave, u64 mac,
1987                                int port)
1988 {
1989         struct mlx4_priv *priv = mlx4_priv(dev);
1990         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
1991         struct list_head *mac_list =
1992                 &tracker->slave_list[slave].res_list[RES_MAC];
1993         struct mac_res *res, *tmp;
1994
1995         list_for_each_entry_safe(res, tmp, mac_list, list) {
1996                 if (res->mac == mac && res->port == (u8) port) {
1997                         if (!--res->ref_count) {
1998                                 list_del(&res->list);
1999                                 mlx4_release_resource(dev, slave, RES_MAC, 1, port);
2000                                 kfree(res);
2001                         }
2002                         break;
2003                 }
2004         }
2005 }
2006
2007 static void rem_slave_macs(struct mlx4_dev *dev, int slave)
2008 {
2009         struct mlx4_priv *priv = mlx4_priv(dev);
2010         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
2011         struct list_head *mac_list =
2012                 &tracker->slave_list[slave].res_list[RES_MAC];
2013         struct mac_res *res, *tmp;
2014         int i;
2015
2016         list_for_each_entry_safe(res, tmp, mac_list, list) {
2017                 list_del(&res->list);
2018                 /* dereference the mac the num times the slave referenced it */
2019                 for (i = 0; i < res->ref_count; i++)
2020                         __mlx4_unregister_mac(dev, res->port, res->mac);
2021                 mlx4_release_resource(dev, slave, RES_MAC, 1, res->port);
2022                 kfree(res);
2023         }
2024 }
2025
2026 static int mac_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2027                          u64 in_param, u64 *out_param, int in_port)
2028 {
2029         int err = -EINVAL;
2030         int port;
2031         u64 mac;
2032         u8 smac_index;
2033
2034         if (op != RES_OP_RESERVE_AND_MAP)
2035                 return err;
2036
2037         port = !in_port ? get_param_l(out_param) : in_port;
2038         port = mlx4_slave_convert_port(
2039                         dev, slave, port);
2040
2041         if (port < 0)
2042                 return -EINVAL;
2043         mac = in_param;
2044
2045         err = __mlx4_register_mac(dev, port, mac);
2046         if (err >= 0) {
2047                 smac_index = err;
2048                 set_param_l(out_param, err);
2049                 err = 0;
2050         }
2051
2052         if (!err) {
2053                 err = mac_add_to_slave(dev, slave, mac, port, smac_index);
2054                 if (err)
2055                         __mlx4_unregister_mac(dev, port, mac);
2056         }
2057         return err;
2058 }
2059
2060 static int vlan_add_to_slave(struct mlx4_dev *dev, int slave, u16 vlan,
2061                              int port, int vlan_index)
2062 {
2063         struct mlx4_priv *priv = mlx4_priv(dev);
2064         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
2065         struct list_head *vlan_list =
2066                 &tracker->slave_list[slave].res_list[RES_VLAN];
2067         struct vlan_res *res, *tmp;
2068
2069         list_for_each_entry_safe(res, tmp, vlan_list, list) {
2070                 if (res->vlan == vlan && res->port == (u8) port) {
2071                         /* vlan found. update ref count */
2072                         ++res->ref_count;
2073                         return 0;
2074                 }
2075         }
2076
2077         if (mlx4_grant_resource(dev, slave, RES_VLAN, 1, port))
2078                 return -EINVAL;
2079         res = kzalloc(sizeof(*res), GFP_KERNEL);
2080         if (!res) {
2081                 mlx4_release_resource(dev, slave, RES_VLAN, 1, port);
2082                 return -ENOMEM;
2083         }
2084         res->vlan = vlan;
2085         res->port = (u8) port;
2086         res->vlan_index = vlan_index;
2087         res->ref_count = 1;
2088         list_add_tail(&res->list,
2089                       &tracker->slave_list[slave].res_list[RES_VLAN]);
2090         return 0;
2091 }
2092
2093
2094 static void vlan_del_from_slave(struct mlx4_dev *dev, int slave, u16 vlan,
2095                                 int port)
2096 {
2097         struct mlx4_priv *priv = mlx4_priv(dev);
2098         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
2099         struct list_head *vlan_list =
2100                 &tracker->slave_list[slave].res_list[RES_VLAN];
2101         struct vlan_res *res, *tmp;
2102
2103         list_for_each_entry_safe(res, tmp, vlan_list, list) {
2104                 if (res->vlan == vlan && res->port == (u8) port) {
2105                         if (!--res->ref_count) {
2106                                 list_del(&res->list);
2107                                 mlx4_release_resource(dev, slave, RES_VLAN,
2108                                                       1, port);
2109                                 kfree(res);
2110                         }
2111                         break;
2112                 }
2113         }
2114 }
2115
2116 static void rem_slave_vlans(struct mlx4_dev *dev, int slave)
2117 {
2118         struct mlx4_priv *priv = mlx4_priv(dev);
2119         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
2120         struct list_head *vlan_list =
2121                 &tracker->slave_list[slave].res_list[RES_VLAN];
2122         struct vlan_res *res, *tmp;
2123         int i;
2124
2125         list_for_each_entry_safe(res, tmp, vlan_list, list) {
2126                 list_del(&res->list);
2127                 /* dereference the vlan the num times the slave referenced it */
2128                 for (i = 0; i < res->ref_count; i++)
2129                         __mlx4_unregister_vlan(dev, res->port, res->vlan);
2130                 mlx4_release_resource(dev, slave, RES_VLAN, 1, res->port);
2131                 kfree(res);
2132         }
2133 }
2134
2135 static int vlan_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2136                           u64 in_param, u64 *out_param, int in_port)
2137 {
2138         struct mlx4_priv *priv = mlx4_priv(dev);
2139         struct mlx4_slave_state *slave_state = priv->mfunc.master.slave_state;
2140         int err;
2141         u16 vlan;
2142         int vlan_index;
2143         int port;
2144
2145         port = !in_port ? get_param_l(out_param) : in_port;
2146
2147         if (!port || op != RES_OP_RESERVE_AND_MAP)
2148                 return -EINVAL;
2149
2150         port = mlx4_slave_convert_port(
2151                         dev, slave, port);
2152
2153         if (port < 0)
2154                 return -EINVAL;
2155         /* upstream kernels had NOP for reg/unreg vlan. Continue this. */
2156         if (!in_port && port > 0 && port <= dev->caps.num_ports) {
2157                 slave_state[slave].old_vlan_api = true;
2158                 return 0;
2159         }
2160
2161         vlan = (u16) in_param;
2162
2163         err = __mlx4_register_vlan(dev, port, vlan, &vlan_index);
2164         if (!err) {
2165                 set_param_l(out_param, (u32) vlan_index);
2166                 err = vlan_add_to_slave(dev, slave, vlan, port, vlan_index);
2167                 if (err)
2168                         __mlx4_unregister_vlan(dev, port, vlan);
2169         }
2170         return err;
2171 }
2172
2173 static int counter_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2174                              u64 in_param, u64 *out_param, int port)
2175 {
2176         u32 index;
2177         int err;
2178
2179         if (op != RES_OP_RESERVE)
2180                 return -EINVAL;
2181
2182         err = mlx4_grant_resource(dev, slave, RES_COUNTER, 1, 0);
2183         if (err)
2184                 return err;
2185
2186         err = __mlx4_counter_alloc(dev, &index);
2187         if (err) {
2188                 mlx4_release_resource(dev, slave, RES_COUNTER, 1, 0);
2189                 return err;
2190         }
2191
2192         err = add_res_range(dev, slave, index, 1, RES_COUNTER, port);
2193         if (err) {
2194                 __mlx4_counter_free(dev, index);
2195                 mlx4_release_resource(dev, slave, RES_COUNTER, 1, 0);
2196         } else {
2197                 set_param_l(out_param, index);
2198         }
2199
2200         return err;
2201 }
2202
2203 static int xrcdn_alloc_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2204                            u64 in_param, u64 *out_param)
2205 {
2206         u32 xrcdn;
2207         int err;
2208
2209         if (op != RES_OP_RESERVE)
2210                 return -EINVAL;
2211
2212         err = __mlx4_xrcd_alloc(dev, &xrcdn);
2213         if (err)
2214                 return err;
2215
2216         err = add_res_range(dev, slave, xrcdn, 1, RES_XRCD, 0);
2217         if (err)
2218                 __mlx4_xrcd_free(dev, xrcdn);
2219         else
2220                 set_param_l(out_param, xrcdn);
2221
2222         return err;
2223 }
2224
2225 int mlx4_ALLOC_RES_wrapper(struct mlx4_dev *dev, int slave,
2226                            struct mlx4_vhcr *vhcr,
2227                            struct mlx4_cmd_mailbox *inbox,
2228                            struct mlx4_cmd_mailbox *outbox,
2229                            struct mlx4_cmd_info *cmd)
2230 {
2231         int err;
2232         int alop = vhcr->op_modifier;
2233
2234         switch (vhcr->in_modifier & 0xFF) {
2235         case RES_QP:
2236                 err = qp_alloc_res(dev, slave, vhcr->op_modifier, alop,
2237                                    vhcr->in_param, &vhcr->out_param);
2238                 break;
2239
2240         case RES_MTT:
2241                 err = mtt_alloc_res(dev, slave, vhcr->op_modifier, alop,
2242                                     vhcr->in_param, &vhcr->out_param);
2243                 break;
2244
2245         case RES_MPT:
2246                 err = mpt_alloc_res(dev, slave, vhcr->op_modifier, alop,
2247                                     vhcr->in_param, &vhcr->out_param);
2248                 break;
2249
2250         case RES_CQ:
2251                 err = cq_alloc_res(dev, slave, vhcr->op_modifier, alop,
2252                                    vhcr->in_param, &vhcr->out_param);
2253                 break;
2254
2255         case RES_SRQ:
2256                 err = srq_alloc_res(dev, slave, vhcr->op_modifier, alop,
2257                                     vhcr->in_param, &vhcr->out_param);
2258                 break;
2259
2260         case RES_MAC:
2261                 err = mac_alloc_res(dev, slave, vhcr->op_modifier, alop,
2262                                     vhcr->in_param, &vhcr->out_param,
2263                                     (vhcr->in_modifier >> 8) & 0xFF);
2264                 break;
2265
2266         case RES_VLAN:
2267                 err = vlan_alloc_res(dev, slave, vhcr->op_modifier, alop,
2268                                      vhcr->in_param, &vhcr->out_param,
2269                                      (vhcr->in_modifier >> 8) & 0xFF);
2270                 break;
2271
2272         case RES_COUNTER:
2273                 err = counter_alloc_res(dev, slave, vhcr->op_modifier, alop,
2274                                         vhcr->in_param, &vhcr->out_param, 0);
2275                 break;
2276
2277         case RES_XRCD:
2278                 err = xrcdn_alloc_res(dev, slave, vhcr->op_modifier, alop,
2279                                       vhcr->in_param, &vhcr->out_param);
2280                 break;
2281
2282         default:
2283                 err = -EINVAL;
2284                 break;
2285         }
2286
2287         return err;
2288 }
2289
2290 static int qp_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2291                        u64 in_param)
2292 {
2293         int err;
2294         int count;
2295         int base;
2296         int qpn;
2297
2298         switch (op) {
2299         case RES_OP_RESERVE:
2300                 base = get_param_l(&in_param) & 0x7fffff;
2301                 count = get_param_h(&in_param);
2302                 err = rem_res_range(dev, slave, base, count, RES_QP, 0);
2303                 if (err)
2304                         break;
2305                 mlx4_release_resource(dev, slave, RES_QP, count, 0);
2306                 __mlx4_qp_release_range(dev, base, count);
2307                 break;
2308         case RES_OP_MAP_ICM:
2309                 qpn = get_param_l(&in_param) & 0x7fffff;
2310                 err = qp_res_start_move_to(dev, slave, qpn, RES_QP_RESERVED,
2311                                            NULL, 0);
2312                 if (err)
2313                         return err;
2314
2315                 if (!fw_reserved(dev, qpn))
2316                         __mlx4_qp_free_icm(dev, qpn);
2317
2318                 res_end_move(dev, slave, RES_QP, qpn);
2319
2320                 if (valid_reserved(dev, slave, qpn))
2321                         err = rem_res_range(dev, slave, qpn, 1, RES_QP, 0);
2322                 break;
2323         default:
2324                 err = -EINVAL;
2325                 break;
2326         }
2327         return err;
2328 }
2329
2330 static int mtt_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2331                         u64 in_param, u64 *out_param)
2332 {
2333         int err = -EINVAL;
2334         int base;
2335         int order;
2336
2337         if (op != RES_OP_RESERVE_AND_MAP)
2338                 return err;
2339
2340         base = get_param_l(&in_param);
2341         order = get_param_h(&in_param);
2342         err = rem_res_range(dev, slave, base, 1, RES_MTT, order);
2343         if (!err) {
2344                 mlx4_release_resource(dev, slave, RES_MTT, 1 << order, 0);
2345                 __mlx4_free_mtt_range(dev, base, order);
2346         }
2347         return err;
2348 }
2349
2350 static int mpt_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2351                         u64 in_param)
2352 {
2353         int err = -EINVAL;
2354         int index;
2355         int id;
2356         struct res_mpt *mpt;
2357
2358         switch (op) {
2359         case RES_OP_RESERVE:
2360                 index = get_param_l(&in_param);
2361                 id = index & mpt_mask(dev);
2362                 err = get_res(dev, slave, id, RES_MPT, &mpt);
2363                 if (err)
2364                         break;
2365                 index = mpt->key;
2366                 put_res(dev, slave, id, RES_MPT);
2367
2368                 err = rem_res_range(dev, slave, id, 1, RES_MPT, 0);
2369                 if (err)
2370                         break;
2371                 mlx4_release_resource(dev, slave, RES_MPT, 1, 0);
2372                 __mlx4_mpt_release(dev, index);
2373                 break;
2374         case RES_OP_MAP_ICM:
2375                         index = get_param_l(&in_param);
2376                         id = index & mpt_mask(dev);
2377                         err = mr_res_start_move_to(dev, slave, id,
2378                                                    RES_MPT_RESERVED, &mpt);
2379                         if (err)
2380                                 return err;
2381
2382                         __mlx4_mpt_free_icm(dev, mpt->key);
2383                         res_end_move(dev, slave, RES_MPT, id);
2384                         return err;
2385                 break;
2386         default:
2387                 err = -EINVAL;
2388                 break;
2389         }
2390         return err;
2391 }
2392
2393 static int cq_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2394                        u64 in_param, u64 *out_param)
2395 {
2396         int cqn;
2397         int err;
2398
2399         switch (op) {
2400         case RES_OP_RESERVE_AND_MAP:
2401                 cqn = get_param_l(&in_param);
2402                 err = rem_res_range(dev, slave, cqn, 1, RES_CQ, 0);
2403                 if (err)
2404                         break;
2405
2406                 mlx4_release_resource(dev, slave, RES_CQ, 1, 0);
2407                 __mlx4_cq_free_icm(dev, cqn);
2408                 break;
2409
2410         default:
2411                 err = -EINVAL;
2412                 break;
2413         }
2414
2415         return err;
2416 }
2417
2418 static int srq_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2419                         u64 in_param, u64 *out_param)
2420 {
2421         int srqn;
2422         int err;
2423
2424         switch (op) {
2425         case RES_OP_RESERVE_AND_MAP:
2426                 srqn = get_param_l(&in_param);
2427                 err = rem_res_range(dev, slave, srqn, 1, RES_SRQ, 0);
2428                 if (err)
2429                         break;
2430
2431                 mlx4_release_resource(dev, slave, RES_SRQ, 1, 0);
2432                 __mlx4_srq_free_icm(dev, srqn);
2433                 break;
2434
2435         default:
2436                 err = -EINVAL;
2437                 break;
2438         }
2439
2440         return err;
2441 }
2442
2443 static int mac_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2444                             u64 in_param, u64 *out_param, int in_port)
2445 {
2446         int port;
2447         int err = 0;
2448
2449         switch (op) {
2450         case RES_OP_RESERVE_AND_MAP:
2451                 port = !in_port ? get_param_l(out_param) : in_port;
2452                 port = mlx4_slave_convert_port(
2453                                 dev, slave, port);
2454
2455                 if (port < 0)
2456                         return -EINVAL;
2457                 mac_del_from_slave(dev, slave, in_param, port);
2458                 __mlx4_unregister_mac(dev, port, in_param);
2459                 break;
2460         default:
2461                 err = -EINVAL;
2462                 break;
2463         }
2464
2465         return err;
2466
2467 }
2468
2469 static int vlan_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2470                             u64 in_param, u64 *out_param, int port)
2471 {
2472         struct mlx4_priv *priv = mlx4_priv(dev);
2473         struct mlx4_slave_state *slave_state = priv->mfunc.master.slave_state;
2474         int err = 0;
2475
2476         port = mlx4_slave_convert_port(
2477                         dev, slave, port);
2478
2479         if (port < 0)
2480                 return -EINVAL;
2481         switch (op) {
2482         case RES_OP_RESERVE_AND_MAP:
2483                 if (slave_state[slave].old_vlan_api)
2484                         return 0;
2485                 if (!port)
2486                         return -EINVAL;
2487                 vlan_del_from_slave(dev, slave, in_param, port);
2488                 __mlx4_unregister_vlan(dev, port, in_param);
2489                 break;
2490         default:
2491                 err = -EINVAL;
2492                 break;
2493         }
2494
2495         return err;
2496 }
2497
2498 static int counter_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2499                             u64 in_param, u64 *out_param)
2500 {
2501         int index;
2502         int err;
2503
2504         if (op != RES_OP_RESERVE)
2505                 return -EINVAL;
2506
2507         index = get_param_l(&in_param);
2508         if (index == MLX4_SINK_COUNTER_INDEX(dev))
2509                 return 0;
2510
2511         err = rem_res_range(dev, slave, index, 1, RES_COUNTER, 0);
2512         if (err)
2513                 return err;
2514
2515         __mlx4_counter_free(dev, index);
2516         mlx4_release_resource(dev, slave, RES_COUNTER, 1, 0);
2517
2518         return err;
2519 }
2520
2521 static int xrcdn_free_res(struct mlx4_dev *dev, int slave, int op, int cmd,
2522                           u64 in_param, u64 *out_param)
2523 {
2524         int xrcdn;
2525         int err;
2526
2527         if (op != RES_OP_RESERVE)
2528                 return -EINVAL;
2529
2530         xrcdn = get_param_l(&in_param);
2531         err = rem_res_range(dev, slave, xrcdn, 1, RES_XRCD, 0);
2532         if (err)
2533                 return err;
2534
2535         __mlx4_xrcd_free(dev, xrcdn);
2536
2537         return err;
2538 }
2539
2540 int mlx4_FREE_RES_wrapper(struct mlx4_dev *dev, int slave,
2541                           struct mlx4_vhcr *vhcr,
2542                           struct mlx4_cmd_mailbox *inbox,
2543                           struct mlx4_cmd_mailbox *outbox,
2544                           struct mlx4_cmd_info *cmd)
2545 {
2546         int err = -EINVAL;
2547         int alop = vhcr->op_modifier;
2548
2549         switch (vhcr->in_modifier & 0xFF) {
2550         case RES_QP:
2551                 err = qp_free_res(dev, slave, vhcr->op_modifier, alop,
2552                                   vhcr->in_param);
2553                 break;
2554
2555         case RES_MTT:
2556                 err = mtt_free_res(dev, slave, vhcr->op_modifier, alop,
2557                                    vhcr->in_param, &vhcr->out_param);
2558                 break;
2559
2560         case RES_MPT:
2561                 err = mpt_free_res(dev, slave, vhcr->op_modifier, alop,
2562                                    vhcr->in_param);
2563                 break;
2564
2565         case RES_CQ:
2566                 err = cq_free_res(dev, slave, vhcr->op_modifier, alop,
2567                                   vhcr->in_param, &vhcr->out_param);
2568                 break;
2569
2570         case RES_SRQ:
2571                 err = srq_free_res(dev, slave, vhcr->op_modifier, alop,
2572                                    vhcr->in_param, &vhcr->out_param);
2573                 break;
2574
2575         case RES_MAC:
2576                 err = mac_free_res(dev, slave, vhcr->op_modifier, alop,
2577                                    vhcr->in_param, &vhcr->out_param,
2578                                    (vhcr->in_modifier >> 8) & 0xFF);
2579                 break;
2580
2581         case RES_VLAN:
2582                 err = vlan_free_res(dev, slave, vhcr->op_modifier, alop,
2583                                     vhcr->in_param, &vhcr->out_param,
2584                                     (vhcr->in_modifier >> 8) & 0xFF);
2585                 break;
2586
2587         case RES_COUNTER:
2588                 err = counter_free_res(dev, slave, vhcr->op_modifier, alop,
2589                                        vhcr->in_param, &vhcr->out_param);
2590                 break;
2591
2592         case RES_XRCD:
2593                 err = xrcdn_free_res(dev, slave, vhcr->op_modifier, alop,
2594                                      vhcr->in_param, &vhcr->out_param);
2595
2596         default:
2597                 break;
2598         }
2599         return err;
2600 }
2601
2602 /* ugly but other choices are uglier */
2603 static int mr_phys_mpt(struct mlx4_mpt_entry *mpt)
2604 {
2605         return (be32_to_cpu(mpt->flags) >> 9) & 1;
2606 }
2607
2608 static int mr_get_mtt_addr(struct mlx4_mpt_entry *mpt)
2609 {
2610         return (int)be64_to_cpu(mpt->mtt_addr) & 0xfffffff8;
2611 }
2612
2613 static int mr_get_mtt_size(struct mlx4_mpt_entry *mpt)
2614 {
2615         return be32_to_cpu(mpt->mtt_sz);
2616 }
2617
2618 static u32 mr_get_pd(struct mlx4_mpt_entry *mpt)
2619 {
2620         return be32_to_cpu(mpt->pd_flags) & 0x00ffffff;
2621 }
2622
2623 static int mr_is_fmr(struct mlx4_mpt_entry *mpt)
2624 {
2625         return be32_to_cpu(mpt->pd_flags) & MLX4_MPT_PD_FLAG_FAST_REG;
2626 }
2627
2628 static int mr_is_bind_enabled(struct mlx4_mpt_entry *mpt)
2629 {
2630         return be32_to_cpu(mpt->flags) & MLX4_MPT_FLAG_BIND_ENABLE;
2631 }
2632
2633 static int mr_is_region(struct mlx4_mpt_entry *mpt)
2634 {
2635         return be32_to_cpu(mpt->flags) & MLX4_MPT_FLAG_REGION;
2636 }
2637
2638 static int qp_get_mtt_addr(struct mlx4_qp_context *qpc)
2639 {
2640         return be32_to_cpu(qpc->mtt_base_addr_l) & 0xfffffff8;
2641 }
2642
2643 static int srq_get_mtt_addr(struct mlx4_srq_context *srqc)
2644 {
2645         return be32_to_cpu(srqc->mtt_base_addr_l) & 0xfffffff8;
2646 }
2647
2648 static int qp_get_mtt_size(struct mlx4_qp_context *qpc)
2649 {
2650         int page_shift = (qpc->log_page_size & 0x3f) + 12;
2651         int log_sq_size = (qpc->sq_size_stride >> 3) & 0xf;
2652         int log_sq_sride = qpc->sq_size_stride & 7;
2653         int log_rq_size = (qpc->rq_size_stride >> 3) & 0xf;
2654         int log_rq_stride = qpc->rq_size_stride & 7;
2655         int srq = (be32_to_cpu(qpc->srqn) >> 24) & 1;
2656         int rss = (be32_to_cpu(qpc->flags) >> 13) & 1;
2657         u32 ts = (be32_to_cpu(qpc->flags) >> 16) & 0xff;
2658         int xrc = (ts == MLX4_QP_ST_XRC) ? 1 : 0;
2659         int sq_size;
2660         int rq_size;
2661         int total_pages;
2662         int total_mem;
2663         int page_offset = (be32_to_cpu(qpc->params2) >> 6) & 0x3f;
2664
2665         sq_size = 1 << (log_sq_size + log_sq_sride + 4);
2666         rq_size = (srq|rss|xrc) ? 0 : (1 << (log_rq_size + log_rq_stride + 4));
2667         total_mem = sq_size + rq_size;
2668         total_pages =
2669                 roundup_pow_of_two((total_mem + (page_offset << 6)) >>
2670                                    page_shift);
2671
2672         return total_pages;
2673 }
2674
2675 static int check_mtt_range(struct mlx4_dev *dev, int slave, int start,
2676                            int size, struct res_mtt *mtt)
2677 {
2678         int res_start = mtt->com.res_id;
2679         int res_size = (1 << mtt->order);
2680
2681         if (start < res_start || start + size > res_start + res_size)
2682                 return -EPERM;
2683         return 0;
2684 }
2685
/*
 * Handle a slave's SW2HW_MPT command.
 *
 * The MPT (index taken from vhcr->in_modifier, masked with mpt_mask())
 * is moved towards RES_MPT_HW.  The mailbox contents are validated before
 * the command is forwarded with mlx4_DMA_wrapper():
 *  - the entry must be a region (memory windows are rejected),
 *  - the slave-id bits of the PD must be zero or identify this slave,
 *  - a fast-register entry must not have bind enabled,
 *  - for non-physical MPTs, the referenced MTT range must lie inside an
 *    MTT resource owned by the slave.
 *
 * On success the MTT's ref_count is incremented (non-physical case) and
 * the state move is committed; on failure the move is aborted.
 *
 * Returns 0 on success or a negative errno.
 */
int mlx4_SW2HW_MPT_wrapper(struct mlx4_dev *dev, int slave,
                           struct mlx4_vhcr *vhcr,
                           struct mlx4_cmd_mailbox *inbox,
                           struct mlx4_cmd_mailbox *outbox,
                           struct mlx4_cmd_info *cmd)
{
        int err;
        int index = vhcr->in_modifier;
        struct res_mtt *mtt;
        struct res_mpt *mpt;
        /* MTT base expressed in MTT entries rather than bytes. */
        int mtt_base = mr_get_mtt_addr(inbox->buf) / dev->caps.mtt_entry_sz;
        int phys;
        int id;
        u32 pd;
        int pd_slave;

        id = index & mpt_mask(dev);
        err = mr_res_start_move_to(dev, slave, id, RES_MPT_HW, &mpt);
        if (err)
                return err;

        /* Disable memory windows for VFs. */
        if (!mr_is_region(inbox->buf)) {
                err = -EPERM;
                goto ex_abort;
        }

        /* Make sure that the PD bits related to the slave id are zeros. */
        pd = mr_get_pd(inbox->buf);
        pd_slave = (pd >> 17) & 0x7f;
        /* A non-zero field is accepted only when it equals slave + 1. */
        if (pd_slave != 0 && --pd_slave != slave) {
                err = -EPERM;
                goto ex_abort;
        }

        if (mr_is_fmr(inbox->buf)) {
                /* FMR and Bind Enable are forbidden in slave devices. */
                if (mr_is_bind_enabled(inbox->buf)) {
                        err = -EPERM;
                        goto ex_abort;
                }
                /* FMR and Memory Windows are also forbidden. */
                /* NOTE(review): the same region test already aborted above,
                 * so this branch cannot be taken here.
                 */
                if (!mr_is_region(inbox->buf)) {
                        err = -EPERM;
                        goto ex_abort;
                }
        }

        phys = mr_phys_mpt(inbox->buf);
        if (!phys) {
                /* Hold the MTT while its range is checked and the command runs. */
                err = get_res(dev, slave, mtt_base, RES_MTT, &mtt);
                if (err)
                        goto ex_abort;

                err = check_mtt_range(dev, slave, mtt_base,
                                      mr_get_mtt_size(inbox->buf), mtt);
                if (err)
                        goto ex_put;

                mpt->mtt = mtt;
        }

        err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
        if (err)
                goto ex_put;

        if (!phys) {
                /* The MPT now references the MTT; count it, then release it. */
                atomic_inc(&mtt->ref_count);
                put_res(dev, slave, mtt->com.res_id, RES_MTT);
        }

        res_end_move(dev, slave, RES_MPT, id);
        return 0;

ex_put:
        /* mtt was only acquired in the non-physical case. */
        if (!phys)
                put_res(dev, slave, mtt->com.res_id, RES_MTT);
ex_abort:
        res_abort_move(dev, slave, RES_MPT, id);

        return err;
}
2768
2769 int mlx4_HW2SW_MPT_wrapper(struct mlx4_dev *dev, int slave,
2770                            struct mlx4_vhcr *vhcr,
2771                            struct mlx4_cmd_mailbox *inbox,
2772                            struct mlx4_cmd_mailbox *outbox,
2773                            struct mlx4_cmd_info *cmd)
2774 {
2775         int err;
2776         int index = vhcr->in_modifier;
2777         struct res_mpt *mpt;
2778         int id;
2779
2780         id = index & mpt_mask(dev);
2781         err = mr_res_start_move_to(dev, slave, id, RES_MPT_MAPPED, &mpt);
2782         if (err)
2783                 return err;
2784
2785         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
2786         if (err)
2787                 goto ex_abort;
2788
2789         if (mpt->mtt)
2790                 atomic_dec(&mpt->mtt->ref_count);
2791
2792         res_end_move(dev, slave, RES_MPT, id);
2793         return 0;
2794
2795 ex_abort:
2796         res_abort_move(dev, slave, RES_MPT, id);
2797
2798         return err;
2799 }
2800
2801 int mlx4_QUERY_MPT_wrapper(struct mlx4_dev *dev, int slave,
2802                            struct mlx4_vhcr *vhcr,
2803                            struct mlx4_cmd_mailbox *inbox,
2804                            struct mlx4_cmd_mailbox *outbox,
2805                            struct mlx4_cmd_info *cmd)
2806 {
2807         int err;
2808         int index = vhcr->in_modifier;
2809         struct res_mpt *mpt;
2810         int id;
2811
2812         id = index & mpt_mask(dev);
2813         err = get_res(dev, slave, id, RES_MPT, &mpt);
2814         if (err)
2815                 return err;
2816
2817         if (mpt->com.from_state == RES_MPT_MAPPED) {
2818                 /* In order to allow rereg in SRIOV, we need to alter the MPT entry. To do
2819                  * that, the VF must read the MPT. But since the MPT entry memory is not
2820                  * in the VF's virtual memory space, it must use QUERY_MPT to obtain the
2821                  * entry contents. To guarantee that the MPT cannot be changed, the driver
2822                  * must perform HW2SW_MPT before this query and return the MPT entry to HW
2823                  * ownership fofollowing the change. The change here allows the VF to
2824                  * perform QUERY_MPT also when the entry is in SW ownership.
2825                  */
2826                 struct mlx4_mpt_entry *mpt_entry = mlx4_table_find(
2827                                         &mlx4_priv(dev)->mr_table.dmpt_table,
2828                                         mpt->key, NULL);
2829
2830                 if (NULL == mpt_entry || NULL == outbox->buf) {
2831                         err = -EINVAL;
2832                         goto out;
2833                 }
2834
2835                 memcpy(outbox->buf, mpt_entry, sizeof(*mpt_entry));
2836
2837                 err = 0;
2838         } else if (mpt->com.from_state == RES_MPT_HW) {
2839                 err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
2840         } else {
2841                 err = -EBUSY;
2842                 goto out;
2843         }
2844
2845
2846 out:
2847         put_res(dev, slave, id, RES_MPT);
2848         return err;
2849 }
2850
2851 static int qp_get_rcqn(struct mlx4_qp_context *qpc)
2852 {
2853         return be32_to_cpu(qpc->cqn_recv) & 0xffffff;
2854 }
2855
2856 static int qp_get_scqn(struct mlx4_qp_context *qpc)
2857 {
2858         return be32_to_cpu(qpc->cqn_send) & 0xffffff;
2859 }
2860
2861 static u32 qp_get_srqn(struct mlx4_qp_context *qpc)
2862 {
2863         return be32_to_cpu(qpc->srqn) & 0x1ffffff;
2864 }
2865
2866 static void adjust_proxy_tun_qkey(struct mlx4_dev *dev, struct mlx4_vhcr *vhcr,
2867                                   struct mlx4_qp_context *context)
2868 {
2869         u32 qpn = vhcr->in_modifier & 0xffffff;
2870         u32 qkey = 0;
2871
2872         if (mlx4_get_parav_qkey(dev, qpn, &qkey))
2873                 return;
2874
2875         /* adjust qkey in qp context */
2876         context->qkey = cpu_to_be32(qkey);
2877 }
2878
/*
 * Forward declaration: mlx4_RST2INIT_QP_wrapper() calls this before its
 * definition is seen.  Being static, it is defined elsewhere in this file.
 */
static int adjust_qp_sched_queue(struct mlx4_dev *dev, int slave,
                                 struct mlx4_qp_context *qpc,
                                 struct mlx4_cmd_mailbox *inbox);
2882
/*
 * Handle a slave's RST2INIT_QP command.
 *
 * The QP context starts 8 bytes into the input mailbox.  After the
 * scheduling queue is adjusted, the QP is moved towards RES_QP_HW and the
 * resources the context refers to are acquired in order: the MTT (whose
 * range is checked), the receive CQ, the send CQ (only when it differs
 * from the receive CQ) and, when the context uses one, the SRQ.  The
 * command is then forwarded with mlx4_DMA_wrapper().
 *
 * On success every referenced resource has its ref_count incremented, is
 * recorded in the tracked QP and is released again with put_res(), and
 * the state move is committed.  On failure the resources acquired so far
 * are released in reverse order and the move is aborted.
 *
 * Returns 0 on success or a negative errno.
 */
int mlx4_RST2INIT_QP_wrapper(struct mlx4_dev *dev, int slave,
                             struct mlx4_vhcr *vhcr,
                             struct mlx4_cmd_mailbox *inbox,
                             struct mlx4_cmd_mailbox *outbox,
                             struct mlx4_cmd_info *cmd)
{
        int err;
        int qpn = vhcr->in_modifier & 0x7fffff;
        struct res_mtt *mtt;
        struct res_qp *qp;
        struct mlx4_qp_context *qpc = inbox->buf + 8;
        /* MTT base expressed in MTT entries rather than bytes. */
        int mtt_base = qp_get_mtt_addr(qpc) / dev->caps.mtt_entry_sz;
        int mtt_size = qp_get_mtt_size(qpc);
        struct res_cq *rcq;
        struct res_cq *scq;
        int rcqn = qp_get_rcqn(qpc);
        int scqn = qp_get_scqn(qpc);
        u32 srqn = qp_get_srqn(qpc) & 0xffffff;
        /* Bit 24 of the srqn word tells whether the QP uses an SRQ. */
        int use_srq = (qp_get_srqn(qpc) >> 24) & 1;
        struct res_srq *srq;
        int local_qpn = be32_to_cpu(qpc->local_qpn) & 0xffffff;

        err = adjust_qp_sched_queue(dev, slave, qpc, inbox);
        if (err)
                return err;

        err = qp_res_start_move_to(dev, slave, qpn, RES_QP_HW, &qp, 0);
        if (err)
                return err;
        /* Reset the per-QP state cached in the tracker entry. */
        qp->local_qpn = local_qpn;
        qp->sched_queue = 0;
        qp->param3 = 0;
        qp->vlan_control = 0;
        qp->fvl_rx = 0;
        qp->pri_path_fl = 0;
        qp->vlan_index = 0;
        qp->feup = 0;
        qp->qpc_flags = be32_to_cpu(qpc->flags);

        err = get_res(dev, slave, mtt_base, RES_MTT, &mtt);
        if (err)
                goto ex_abort;

        err = check_mtt_range(dev, slave, mtt_base, mtt_size, mtt);
        if (err)
                goto ex_put_mtt;

        err = get_res(dev, slave, rcqn, RES_CQ, &rcq);
        if (err)
                goto ex_put_mtt;

        /* Acquire the send CQ separately only when it is a different CQ. */
        if (scqn != rcqn) {
                err = get_res(dev, slave, scqn, RES_CQ, &scq);
                if (err)
                        goto ex_put_rcq;
        } else
                scq = rcq;

        if (use_srq) {
                err = get_res(dev, slave, srqn, RES_SRQ, &srq);
                if (err)
                        goto ex_put_scq;
        }

        adjust_proxy_tun_qkey(dev, vhcr, qpc);
        update_pkey_index(dev, slave, inbox);
        err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
        if (err)
                goto ex_put_srq;
        /* Command succeeded: record and count every referenced resource. */
        atomic_inc(&mtt->ref_count);
        qp->mtt = mtt;
        atomic_inc(&rcq->ref_count);
        qp->rcq = rcq;
        atomic_inc(&scq->ref_count);
        qp->scq = scq;

        if (scqn != rcqn)
                put_res(dev, slave, scqn, RES_CQ);

        if (use_srq) {
                atomic_inc(&srq->ref_count);
                put_res(dev, slave, srqn, RES_SRQ);
                qp->srq = srq;
        }
        put_res(dev, slave, rcqn, RES_CQ);
        put_res(dev, slave, mtt_base, RES_MTT);
        res_end_move(dev, slave, RES_QP, qpn);

        return 0;

        /* Error unwinding: release in reverse order of acquisition. */
ex_put_srq:
        if (use_srq)
                put_res(dev, slave, srqn, RES_SRQ);
ex_put_scq:
        if (scqn != rcqn)
                put_res(dev, slave, scqn, RES_CQ);
ex_put_rcq:
        put_res(dev, slave, rcqn, RES_CQ);
ex_put_mtt:
        put_res(dev, slave, mtt_base, RES_MTT);
ex_abort:
        res_abort_move(dev, slave, RES_QP, qpn);

        return err;
}
2988
2989 static int eq_get_mtt_addr(struct mlx4_eq_context *eqc)
2990 {
2991         return be32_to_cpu(eqc->mtt_base_addr_l) & 0xfffffff8;
2992 }
2993
2994 static int eq_get_mtt_size(struct mlx4_eq_context *eqc)
2995 {
2996         int log_eq_size = eqc->log_eq_size & 0x1f;
2997         int page_shift = (eqc->log_page_size & 0x3f) + 12;
2998
2999         if (log_eq_size + 5 < page_shift)
3000                 return 1;
3001
3002         return 1 << (log_eq_size + 5 - page_shift);
3003 }
3004
3005 static int cq_get_mtt_addr(struct mlx4_cq_context *cqc)
3006 {
3007         return be32_to_cpu(cqc->mtt_base_addr_l) & 0xfffffff8;
3008 }
3009
3010 static int cq_get_mtt_size(struct mlx4_cq_context *cqc)
3011 {
3012         int log_cq_size = (be32_to_cpu(cqc->logsize_usrpage) >> 24) & 0x1f;
3013         int page_shift = (cqc->log_page_size & 0x3f) + 12;
3014
3015         if (log_cq_size + 5 < page_shift)
3016                 return 1;
3017
3018         return 1 << (log_cq_size + 5 - page_shift);
3019 }
3020
/*
 * Handle a slave's SW2HW_EQ command.
 *
 * The EQ is tracked under the id (slave << 10) | eqn.  A tracker entry is
 * added for it and moved towards RES_EQ_HW; the MTT referenced by the EQ
 * context in the input mailbox is acquired and its range checked; then
 * the command is forwarded with mlx4_DMA_wrapper().
 *
 * On success the MTT's ref_count is incremented, the MTT is recorded in
 * the EQ entry and the move is committed.  On failure the steps taken so
 * far are undone, including removal of the tracker entry.
 *
 * Returns 0 on success or a negative errno.
 */
int mlx4_SW2HW_EQ_wrapper(struct mlx4_dev *dev, int slave,
                          struct mlx4_vhcr *vhcr,
                          struct mlx4_cmd_mailbox *inbox,
                          struct mlx4_cmd_mailbox *outbox,
                          struct mlx4_cmd_info *cmd)
{
        int err;
        int eqn = vhcr->in_modifier;
        /* EQ numbers are per slave, so the slave is folded into the id. */
        int res_id = (slave << 10) | eqn;
        struct mlx4_eq_context *eqc = inbox->buf;
        /* MTT base expressed in MTT entries rather than bytes. */
        int mtt_base = eq_get_mtt_addr(eqc) / dev->caps.mtt_entry_sz;
        int mtt_size = eq_get_mtt_size(eqc);
        struct res_eq *eq;
        struct res_mtt *mtt;

        err = add_res_range(dev, slave, res_id, 1, RES_EQ, 0);
        if (err)
                return err;
        err = eq_res_start_move_to(dev, slave, res_id, RES_EQ_HW, &eq);
        if (err)
                goto out_add;

        err = get_res(dev, slave, mtt_base, RES_MTT, &mtt);
        if (err)
                goto out_move;

        err = check_mtt_range(dev, slave, mtt_base, mtt_size, mtt);
        if (err)
                goto out_put;

        err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
        if (err)
                goto out_put;

        /* The EQ now references the MTT; count it, then release it. */
        atomic_inc(&mtt->ref_count);
        eq->mtt = mtt;
        put_res(dev, slave, mtt->com.res_id, RES_MTT);
        res_end_move(dev, slave, RES_EQ, res_id);
        return 0;

        /* Error unwinding: undo in reverse order. */
out_put:
        put_res(dev, slave, mtt->com.res_id, RES_MTT);
out_move:
        res_abort_move(dev, slave, RES_EQ, res_id);
out_add:
        rem_res_range(dev, slave, res_id, 1, RES_EQ, 0);
        return err;
}
3069
3070 int mlx4_CONFIG_DEV_wrapper(struct mlx4_dev *dev, int slave,
3071                             struct mlx4_vhcr *vhcr,
3072                             struct mlx4_cmd_mailbox *inbox,
3073                             struct mlx4_cmd_mailbox *outbox,
3074                             struct mlx4_cmd_info *cmd)
3075 {
3076         int err;
3077         u8 get = vhcr->op_modifier;
3078
3079         if (get != 1)
3080                 return -EPERM;
3081
3082         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3083
3084         return err;
3085 }
3086
3087 static int get_containing_mtt(struct mlx4_dev *dev, int slave, int start,
3088                               int len, struct res_mtt **res)
3089 {
3090         struct mlx4_priv *priv = mlx4_priv(dev);
3091         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
3092         struct res_mtt *mtt;
3093         int err = -EINVAL;
3094
3095         spin_lock_irq(mlx4_tlock(dev));
3096         list_for_each_entry(mtt, &tracker->slave_list[slave].res_list[RES_MTT],
3097                             com.list) {
3098                 if (!check_mtt_range(dev, slave, start, len, mtt)) {
3099                         *res = mtt;
3100                         mtt->com.from_state = mtt->com.state;
3101                         mtt->com.state = RES_MTT_BUSY;
3102                         err = 0;
3103                         break;
3104                 }
3105         }
3106         spin_unlock_irq(mlx4_tlock(dev));
3107
3108         return err;
3109 }
3110
3111 static int verify_qp_parameters(struct mlx4_dev *dev,
3112                                 struct mlx4_vhcr *vhcr,
3113                                 struct mlx4_cmd_mailbox *inbox,
3114                                 enum qp_transition transition, u8 slave)
3115 {
3116         u32                     qp_type;
3117         u32                     qpn;
3118         struct mlx4_qp_context  *qp_ctx;
3119         enum mlx4_qp_optpar     optpar;
3120         int port;
3121         int num_gids;
3122
3123         qp_ctx  = inbox->buf + 8;
3124         qp_type = (be32_to_cpu(qp_ctx->flags) >> 16) & 0xff;
3125         optpar  = be32_to_cpu(*(__be32 *) inbox->buf);
3126
3127         if (slave != mlx4_master_func_num(dev)) {
3128                 qp_ctx->params2 &= ~MLX4_QP_BIT_FPP;
3129                 /* setting QP rate-limit is disallowed for VFs */
3130                 if (qp_ctx->rate_limit_params)
3131                         return -EPERM;
3132         }
3133
3134         switch (qp_type) {
3135         case MLX4_QP_ST_RC:
3136         case MLX4_QP_ST_XRC:
3137         case MLX4_QP_ST_UC:
3138                 switch (transition) {
3139                 case QP_TRANS_INIT2RTR:
3140                 case QP_TRANS_RTR2RTS:
3141                 case QP_TRANS_RTS2RTS:
3142                 case QP_TRANS_SQD2SQD:
3143                 case QP_TRANS_SQD2RTS:
3144                         if (slave != mlx4_master_func_num(dev))
3145                                 if (optpar & MLX4_QP_OPTPAR_PRIMARY_ADDR_PATH) {
3146                                         port = (qp_ctx->pri_path.sched_queue >> 6 & 1) + 1;
3147                                         if (dev->caps.port_mask[port] != MLX4_PORT_TYPE_IB)
3148                                                 num_gids = mlx4_get_slave_num_gids(dev, slave, port);
3149                                         else
3150                                                 num_gids = 1;
3151                                         if (qp_ctx->pri_path.mgid_index >= num_gids)
3152                                                 return -EINVAL;
3153                                 }
3154                                 if (optpar & MLX4_QP_OPTPAR_ALT_ADDR_PATH) {
3155                                         port = (qp_ctx->alt_path.sched_queue >> 6 & 1) + 1;
3156                                         if (dev->caps.port_mask[port] != MLX4_PORT_TYPE_IB)
3157                                                 num_gids = mlx4_get_slave_num_gids(dev, slave, port);
3158                                         else
3159                                                 num_gids = 1;
3160                                         if (qp_ctx->alt_path.mgid_index >= num_gids)
3161                                                 return -EINVAL;
3162                                 }
3163                         break;
3164                 default:
3165                         break;
3166                 }
3167                 break;
3168
3169         case MLX4_QP_ST_MLX:
3170                 qpn = vhcr->in_modifier & 0x7fffff;
3171                 port = (qp_ctx->pri_path.sched_queue >> 6 & 1) + 1;
3172                 if (transition == QP_TRANS_INIT2RTR &&
3173                     slave != mlx4_master_func_num(dev) &&
3174                     mlx4_is_qp_reserved(dev, qpn) &&
3175                     !mlx4_vf_smi_enabled(dev, slave, port)) {
3176                         /* only enabled VFs may create MLX proxy QPs */
3177                         mlx4_err(dev, "%s: unprivileged slave %d attempting to create an MLX proxy special QP on port %d\n",
3178                                  __func__, slave, port);
3179                         return -EPERM;
3180                 }
3181                 break;
3182
3183         default:
3184                 break;
3185         }
3186
3187         return 0;
3188 }
3189
/*
 * Handle a slave's WRITE_MTT command in software.
 *
 * The input mailbox is an array of big-endian 64-bit words: word 0 is the
 * first MTT index to write and the page addresses start at word 2.  The
 * number of pages is vhcr->in_modifier.  The target range must lie inside
 * an MTT resource owned by the slave; that resource is held busy for the
 * duration of the write.
 *
 * Returns 0 on success or a negative errno.
 */
int mlx4_WRITE_MTT_wrapper(struct mlx4_dev *dev, int slave,
                           struct mlx4_vhcr *vhcr,
                           struct mlx4_cmd_mailbox *inbox,
                           struct mlx4_cmd_mailbox *outbox,
                           struct mlx4_cmd_info *cmd)
{
        struct mlx4_mtt mtt;
        __be64 *page_list = inbox->buf;
        /* Same buffer viewed as host-endian words; converted in place below. */
        u64 *pg_list = (u64 *)page_list;
        int i;
        struct res_mtt *rmtt = NULL;
        /* NOTE(review): the 64-bit start index is truncated to int here,
         * while the full 64-bit value is passed to __mlx4_write_mtt() below
         * - confirm the two cannot diverge.
         */
        int start = be64_to_cpu(page_list[0]);
        /* NOTE(review): npages is slave-supplied and only bounded by the
         * size of the containing MTT - confirm the mailbox buffer holds
         * npages + 2 words.
         */
        int npages = vhcr->in_modifier;
        int err;

        err = get_containing_mtt(dev, slave, start, npages, &rmtt);
        if (err)
                return err;

        /* Call the SW implementation of write_mtt:
         * - Prepare a dummy mtt struct
         * - Translate inbox contents to simple addresses in host endianness */
        mtt.offset = 0;  /* TBD this is broken but I don't handle it since
                            we don't really use it */
        mtt.order = 0;
        mtt.page_shift = 0;
        /* Convert each page address to host order and clear its low bit. */
        for (i = 0; i < npages; ++i)
                pg_list[i + 2] = (be64_to_cpu(page_list[i + 2]) & ~1ULL);

        err = __mlx4_write_mtt(dev, &mtt, be64_to_cpu(page_list[0]), npages,
                               ((u64 *)page_list + 2));

        /* Release the MTT marked busy by get_containing_mtt(). */
        if (rmtt)
                put_res(dev, slave, rmtt->com.res_id, RES_MTT);

        return err;
}
3227
/*
 * Handle a slave's HW2SW_EQ command.
 *
 * The EQ, tracked under the id eqn | (slave << 10), is moved towards
 * RES_EQ_RESERVED and its MTT is held while the command is forwarded with
 * mlx4_DMA_wrapper().  On success the MTT's ref_count is decremented, the
 * move is committed and the EQ's tracker entry is removed.  On failure the
 * MTT is released and the move is aborted.
 *
 * Returns 0 on success or a negative errno.
 */
int mlx4_HW2SW_EQ_wrapper(struct mlx4_dev *dev, int slave,
                          struct mlx4_vhcr *vhcr,
                          struct mlx4_cmd_mailbox *inbox,
                          struct mlx4_cmd_mailbox *outbox,
                          struct mlx4_cmd_info *cmd)
{
        int eqn = vhcr->in_modifier;
        /* EQ numbers are per slave, so the slave is folded into the id. */
        int res_id = eqn | (slave << 10);
        struct res_eq *eq;
        int err;

        err = eq_res_start_move_to(dev, slave, res_id, RES_EQ_RESERVED, &eq);
        if (err)
                return err;

        /* Hold the EQ's MTT; the resource pointer itself is not needed. */
        err = get_res(dev, slave, eq->mtt->com.res_id, RES_MTT, NULL);
        if (err)
                goto ex_abort;

        err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
        if (err)
                goto ex_put;

        /* The EQ no longer references the MTT. */
        atomic_dec(&eq->mtt->ref_count);
        put_res(dev, slave, eq->mtt->com.res_id, RES_MTT);
        res_end_move(dev, slave, RES_EQ, res_id);
        rem_res_range(dev, slave, res_id, 1, RES_EQ, 0);

        return 0;

ex_put:
        put_res(dev, slave, eq->mtt->com.res_id, RES_MTT);
ex_abort:
        res_abort_move(dev, slave, RES_EQ, res_id);

        return err;
}
3265
/*
 * Generate an event queue entry on a slave's EQ.
 *
 * Nothing is generated (and 0 is returned) when the slave number is out
 * of range, refers to this function itself, the slave is not active, or
 * the slave has no EQ registered for this event type.  Otherwise the
 * slave's EQ must be in the RES_EQ_HW state; the entry is copied into a
 * command mailbox and sent with MLX4_CMD_GEN_EQE.  The whole operation is
 * serialised per slave with gen_eqe_mutex.
 *
 * For MLX4_EVENT_TYPE_CMD events the slave's token counter is incremented
 * and written into the entry before it is sent.
 *
 * Returns 0 on success (or when nothing had to be done), -EINVAL when the
 * slave state array is missing or the EQ is not in HW state, or another
 * negative errno from the helpers.
 */
int mlx4_GEN_EQE(struct mlx4_dev *dev, int slave, struct mlx4_eqe *eqe)
{
        struct mlx4_priv *priv = mlx4_priv(dev);
        struct mlx4_slave_event_eq_info *event_eq;
        struct mlx4_cmd_mailbox *mailbox;
        u32 in_modifier = 0;
        int err;
        int res_id;
        struct res_eq *req;

        if (!priv->mfunc.master.slave_state)
                return -EINVAL;

        /* check for slave valid, slave not PF, and slave active */
        if (slave < 0 || slave > dev->persist->num_vfs ||
            slave == dev->caps.function ||
            !priv->mfunc.master.slave_state[slave].active)
                return 0;

        event_eq = &priv->mfunc.master.slave_state[slave].event_eq[eqe->type];

        /* Create the event only if the slave is registered */
        if (event_eq->eqn < 0)
                return 0;

        mutex_lock(&priv->mfunc.master.gen_eqe_mutex[slave]);
        /* EQs are tracked under an id that folds in the slave number. */
        res_id = (slave << 10) | event_eq->eqn;
        err = get_res(dev, slave, res_id, RES_EQ, &req);
        if (err)
                goto unlock;

        if (req->com.from_state != RES_EQ_HW) {
                err = -EINVAL;
                goto put;
        }

        mailbox = mlx4_alloc_cmd_mailbox(dev);
        if (IS_ERR(mailbox)) {
                err = PTR_ERR(mailbox);
                goto put;
        }

        if (eqe->type == MLX4_EVENT_TYPE_CMD) {
                ++event_eq->token;
                eqe->event.cmd.token = cpu_to_be16(event_eq->token);
        }

        /* NOTE(review): only the first 28 bytes of the entry are passed to
         * the command - confirm this matches the GEN_EQE mailbox layout.
         */
        memcpy(mailbox->buf, (u8 *) eqe, 28);

        /* Slave number in the low byte, EQ number starting at bit 16. */
        in_modifier = (slave & 0xff) | ((event_eq->eqn & 0x3ff) << 16);

        err = mlx4_cmd(dev, mailbox->dma, in_modifier, 0,
                       MLX4_CMD_GEN_EQE, MLX4_CMD_TIME_CLASS_B,
                       MLX4_CMD_NATIVE);

        put_res(dev, slave, res_id, RES_EQ);
        mutex_unlock(&priv->mfunc.master.gen_eqe_mutex[slave]);
        mlx4_free_cmd_mailbox(dev, mailbox);
        return err;

put:
        put_res(dev, slave, res_id, RES_EQ);

unlock:
        mutex_unlock(&priv->mfunc.master.gen_eqe_mutex[slave]);
        return err;
}
3333
3334 int mlx4_QUERY_EQ_wrapper(struct mlx4_dev *dev, int slave,
3335                           struct mlx4_vhcr *vhcr,
3336                           struct mlx4_cmd_mailbox *inbox,
3337                           struct mlx4_cmd_mailbox *outbox,
3338                           struct mlx4_cmd_info *cmd)
3339 {
3340         int eqn = vhcr->in_modifier;
3341         int res_id = eqn | (slave << 10);
3342         struct res_eq *eq;
3343         int err;
3344
3345         err = get_res(dev, slave, res_id, RES_EQ, &eq);
3346         if (err)
3347                 return err;
3348
3349         if (eq->com.from_state != RES_EQ_HW) {
3350                 err = -EINVAL;
3351                 goto ex_put;
3352         }
3353
3354         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3355
3356 ex_put:
3357         put_res(dev, slave, res_id, RES_EQ);
3358         return err;
3359 }
3360
3361 int mlx4_SW2HW_CQ_wrapper(struct mlx4_dev *dev, int slave,
3362                           struct mlx4_vhcr *vhcr,
3363                           struct mlx4_cmd_mailbox *inbox,
3364                           struct mlx4_cmd_mailbox *outbox,
3365                           struct mlx4_cmd_info *cmd)
3366 {
3367         int err;
3368         int cqn = vhcr->in_modifier;
3369         struct mlx4_cq_context *cqc = inbox->buf;
3370         int mtt_base = cq_get_mtt_addr(cqc) / dev->caps.mtt_entry_sz;
3371         struct res_cq *cq = NULL;
3372         struct res_mtt *mtt;
3373
3374         err = cq_res_start_move_to(dev, slave, cqn, RES_CQ_HW, &cq);
3375         if (err)
3376                 return err;
3377         err = get_res(dev, slave, mtt_base, RES_MTT, &mtt);
3378         if (err)
3379                 goto out_move;
3380         err = check_mtt_range(dev, slave, mtt_base, cq_get_mtt_size(cqc), mtt);
3381         if (err)
3382                 goto out_put;
3383         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3384         if (err)
3385                 goto out_put;
3386         atomic_inc(&mtt->ref_count);
3387         cq->mtt = mtt;
3388         put_res(dev, slave, mtt->com.res_id, RES_MTT);
3389         res_end_move(dev, slave, RES_CQ, cqn);
3390         return 0;
3391
3392 out_put:
3393         put_res(dev, slave, mtt->com.res_id, RES_MTT);
3394 out_move:
3395         res_abort_move(dev, slave, RES_CQ, cqn);
3396         return err;
3397 }
3398
3399 int mlx4_HW2SW_CQ_wrapper(struct mlx4_dev *dev, int slave,
3400                           struct mlx4_vhcr *vhcr,
3401                           struct mlx4_cmd_mailbox *inbox,
3402                           struct mlx4_cmd_mailbox *outbox,
3403                           struct mlx4_cmd_info *cmd)
3404 {
3405         int err;
3406         int cqn = vhcr->in_modifier;
3407         struct res_cq *cq = NULL;
3408
3409         err = cq_res_start_move_to(dev, slave, cqn, RES_CQ_ALLOCATED, &cq);
3410         if (err)
3411                 return err;
3412         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3413         if (err)
3414                 goto out_move;
3415         atomic_dec(&cq->mtt->ref_count);
3416         res_end_move(dev, slave, RES_CQ, cqn);
3417         return 0;
3418
3419 out_move:
3420         res_abort_move(dev, slave, RES_CQ, cqn);
3421         return err;
3422 }
3423
3424 int mlx4_QUERY_CQ_wrapper(struct mlx4_dev *dev, int slave,
3425                           struct mlx4_vhcr *vhcr,
3426                           struct mlx4_cmd_mailbox *inbox,
3427                           struct mlx4_cmd_mailbox *outbox,
3428                           struct mlx4_cmd_info *cmd)
3429 {
3430         int cqn = vhcr->in_modifier;
3431         struct res_cq *cq;
3432         int err;
3433
3434         err = get_res(dev, slave, cqn, RES_CQ, &cq);
3435         if (err)
3436                 return err;
3437
3438         if (cq->com.from_state != RES_CQ_HW)
3439                 goto ex_put;
3440
3441         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3442 ex_put:
3443         put_res(dev, slave, cqn, RES_CQ);
3444
3445         return err;
3446 }
3447
3448 static int handle_resize(struct mlx4_dev *dev, int slave,
3449                          struct mlx4_vhcr *vhcr,
3450                          struct mlx4_cmd_mailbox *inbox,
3451                          struct mlx4_cmd_mailbox *outbox,
3452                          struct mlx4_cmd_info *cmd,
3453                          struct res_cq *cq)
3454 {
3455         int err;
3456         struct res_mtt *orig_mtt;
3457         struct res_mtt *mtt;
3458         struct mlx4_cq_context *cqc = inbox->buf;
3459         int mtt_base = cq_get_mtt_addr(cqc) / dev->caps.mtt_entry_sz;
3460
3461         err = get_res(dev, slave, cq->mtt->com.res_id, RES_MTT, &orig_mtt);
3462         if (err)
3463                 return err;
3464
3465         if (orig_mtt != cq->mtt) {
3466                 err = -EINVAL;
3467                 goto ex_put;
3468         }
3469
3470         err = get_res(dev, slave, mtt_base, RES_MTT, &mtt);
3471         if (err)
3472                 goto ex_put;
3473
3474         err = check_mtt_range(dev, slave, mtt_base, cq_get_mtt_size(cqc), mtt);
3475         if (err)
3476                 goto ex_put1;
3477         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3478         if (err)
3479                 goto ex_put1;
3480         atomic_dec(&orig_mtt->ref_count);
3481         put_res(dev, slave, orig_mtt->com.res_id, RES_MTT);
3482         atomic_inc(&mtt->ref_count);
3483         cq->mtt = mtt;
3484         put_res(dev, slave, mtt->com.res_id, RES_MTT);
3485         return 0;
3486
3487 ex_put1:
3488         put_res(dev, slave, mtt->com.res_id, RES_MTT);
3489 ex_put:
3490         put_res(dev, slave, orig_mtt->com.res_id, RES_MTT);
3491
3492         return err;
3493
3494 }
3495
3496 int mlx4_MODIFY_CQ_wrapper(struct mlx4_dev *dev, int slave,
3497                            struct mlx4_vhcr *vhcr,
3498                            struct mlx4_cmd_mailbox *inbox,
3499                            struct mlx4_cmd_mailbox *outbox,
3500                            struct mlx4_cmd_info *cmd)
3501 {
3502         int cqn = vhcr->in_modifier;
3503         struct res_cq *cq;
3504         int err;
3505
3506         err = get_res(dev, slave, cqn, RES_CQ, &cq);
3507         if (err)
3508                 return err;
3509
3510         if (cq->com.from_state != RES_CQ_HW)
3511                 goto ex_put;
3512
3513         if (vhcr->op_modifier == 0) {
3514                 err = handle_resize(dev, slave, vhcr, inbox, outbox, cmd, cq);
3515                 goto ex_put;
3516         }
3517
3518         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3519 ex_put:
3520         put_res(dev, slave, cqn, RES_CQ);
3521
3522         return err;
3523 }
3524
3525 static int srq_get_mtt_size(struct mlx4_srq_context *srqc)
3526 {
3527         int log_srq_size = (be32_to_cpu(srqc->state_logsize_srqn) >> 24) & 0xf;
3528         int log_rq_stride = srqc->logstride & 7;
3529         int page_shift = (srqc->log_page_size & 0x3f) + 12;
3530
3531         if (log_srq_size + log_rq_stride + 4 < page_shift)
3532                 return 1;
3533
3534         return 1 << (log_srq_size + log_rq_stride + 4 - page_shift);
3535 }
3536
3537 int mlx4_SW2HW_SRQ_wrapper(struct mlx4_dev *dev, int slave,
3538                            struct mlx4_vhcr *vhcr,
3539                            struct mlx4_cmd_mailbox *inbox,
3540                            struct mlx4_cmd_mailbox *outbox,
3541                            struct mlx4_cmd_info *cmd)
3542 {
3543         int err;
3544         int srqn = vhcr->in_modifier;
3545         struct res_mtt *mtt;
3546         struct res_srq *srq = NULL;
3547         struct mlx4_srq_context *srqc = inbox->buf;
3548         int mtt_base = srq_get_mtt_addr(srqc) / dev->caps.mtt_entry_sz;
3549
3550         if (srqn != (be32_to_cpu(srqc->state_logsize_srqn) & 0xffffff))
3551                 return -EINVAL;
3552
3553         err = srq_res_start_move_to(dev, slave, srqn, RES_SRQ_HW, &srq);
3554         if (err)
3555                 return err;
3556         err = get_res(dev, slave, mtt_base, RES_MTT, &mtt);
3557         if (err)
3558                 goto ex_abort;
3559         err = check_mtt_range(dev, slave, mtt_base, srq_get_mtt_size(srqc),
3560                               mtt);
3561         if (err)
3562                 goto ex_put_mtt;
3563
3564         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3565         if (err)
3566                 goto ex_put_mtt;
3567
3568         atomic_inc(&mtt->ref_count);
3569         srq->mtt = mtt;
3570         put_res(dev, slave, mtt->com.res_id, RES_MTT);
3571         res_end_move(dev, slave, RES_SRQ, srqn);
3572         return 0;
3573
3574 ex_put_mtt:
3575         put_res(dev, slave, mtt->com.res_id, RES_MTT);
3576 ex_abort:
3577         res_abort_move(dev, slave, RES_SRQ, srqn);
3578
3579         return err;
3580 }
3581
3582 int mlx4_HW2SW_SRQ_wrapper(struct mlx4_dev *dev, int slave,
3583                            struct mlx4_vhcr *vhcr,
3584                            struct mlx4_cmd_mailbox *inbox,
3585                            struct mlx4_cmd_mailbox *outbox,
3586                            struct mlx4_cmd_info *cmd)
3587 {
3588         int err;
3589         int srqn = vhcr->in_modifier;
3590         struct res_srq *srq = NULL;
3591
3592         err = srq_res_start_move_to(dev, slave, srqn, RES_SRQ_ALLOCATED, &srq);
3593         if (err)
3594                 return err;
3595         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3596         if (err)
3597                 goto ex_abort;
3598         atomic_dec(&srq->mtt->ref_count);
3599         if (srq->cq)
3600                 atomic_dec(&srq->cq->ref_count);
3601         res_end_move(dev, slave, RES_SRQ, srqn);
3602
3603         return 0;
3604
3605 ex_abort:
3606         res_abort_move(dev, slave, RES_SRQ, srqn);
3607
3608         return err;
3609 }
3610
3611 int mlx4_QUERY_SRQ_wrapper(struct mlx4_dev *dev, int slave,
3612                            struct mlx4_vhcr *vhcr,
3613                            struct mlx4_cmd_mailbox *inbox,
3614                            struct mlx4_cmd_mailbox *outbox,
3615                            struct mlx4_cmd_info *cmd)
3616 {
3617         int err;
3618         int srqn = vhcr->in_modifier;
3619         struct res_srq *srq;
3620
3621         err = get_res(dev, slave, srqn, RES_SRQ, &srq);
3622         if (err)
3623                 return err;
3624         if (srq->com.from_state != RES_SRQ_HW) {
3625                 err = -EBUSY;
3626                 goto out;
3627         }
3628         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3629 out:
3630         put_res(dev, slave, srqn, RES_SRQ);
3631         return err;
3632 }
3633
3634 int mlx4_ARM_SRQ_wrapper(struct mlx4_dev *dev, int slave,
3635                          struct mlx4_vhcr *vhcr,
3636                          struct mlx4_cmd_mailbox *inbox,
3637                          struct mlx4_cmd_mailbox *outbox,
3638                          struct mlx4_cmd_info *cmd)
3639 {
3640         int err;
3641         int srqn = vhcr->in_modifier;
3642         struct res_srq *srq;
3643
3644         err = get_res(dev, slave, srqn, RES_SRQ, &srq);
3645         if (err)
3646                 return err;
3647
3648         if (srq->com.from_state != RES_SRQ_HW) {
3649                 err = -EBUSY;
3650                 goto out;
3651         }
3652
3653         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3654 out:
3655         put_res(dev, slave, srqn, RES_SRQ);
3656         return err;
3657 }
3658
3659 int mlx4_GEN_QP_wrapper(struct mlx4_dev *dev, int slave,
3660                         struct mlx4_vhcr *vhcr,
3661                         struct mlx4_cmd_mailbox *inbox,
3662                         struct mlx4_cmd_mailbox *outbox,
3663                         struct mlx4_cmd_info *cmd)
3664 {
3665         int err;
3666         int qpn = vhcr->in_modifier & 0x7fffff;
3667         struct res_qp *qp;
3668
3669         err = get_res(dev, slave, qpn, RES_QP, &qp);
3670         if (err)
3671                 return err;
3672         if (qp->com.from_state != RES_QP_HW) {
3673                 err = -EBUSY;
3674                 goto out;
3675         }
3676
3677         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3678 out:
3679         put_res(dev, slave, qpn, RES_QP);
3680         return err;
3681 }
3682
3683 int mlx4_INIT2INIT_QP_wrapper(struct mlx4_dev *dev, int slave,
3684                               struct mlx4_vhcr *vhcr,
3685                               struct mlx4_cmd_mailbox *inbox,
3686                               struct mlx4_cmd_mailbox *outbox,
3687                               struct mlx4_cmd_info *cmd)
3688 {
3689         struct mlx4_qp_context *context = inbox->buf + 8;
3690         adjust_proxy_tun_qkey(dev, vhcr, context);
3691         update_pkey_index(dev, slave, inbox);
3692         return mlx4_GEN_QP_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3693 }
3694
3695 static int adjust_qp_sched_queue(struct mlx4_dev *dev, int slave,
3696                                   struct mlx4_qp_context *qpc,
3697                                   struct mlx4_cmd_mailbox *inbox)
3698 {
3699         enum mlx4_qp_optpar optpar = be32_to_cpu(*(__be32 *)inbox->buf);
3700         u8 pri_sched_queue;
3701         int port = mlx4_slave_convert_port(
3702                    dev, slave, (qpc->pri_path.sched_queue >> 6 & 1) + 1) - 1;
3703
3704         if (port < 0)
3705                 return -EINVAL;
3706
3707         pri_sched_queue = (qpc->pri_path.sched_queue & ~(1 << 6)) |
3708                           ((port & 1) << 6);
3709
3710         if (optpar & (MLX4_QP_OPTPAR_PRIMARY_ADDR_PATH | MLX4_QP_OPTPAR_SCHED_QUEUE) ||
3711             qpc->pri_path.sched_queue || mlx4_is_eth(dev, port + 1)) {
3712                 qpc->pri_path.sched_queue = pri_sched_queue;
3713         }
3714
3715         if (optpar & MLX4_QP_OPTPAR_ALT_ADDR_PATH) {
3716                 port = mlx4_slave_convert_port(
3717                                 dev, slave, (qpc->alt_path.sched_queue >> 6 & 1)
3718                                 + 1) - 1;
3719                 if (port < 0)
3720                         return -EINVAL;
3721                 qpc->alt_path.sched_queue =
3722                         (qpc->alt_path.sched_queue & ~(1 << 6)) |
3723                         (port & 1) << 6;
3724         }
3725         return 0;
3726 }
3727
3728 static int roce_verify_mac(struct mlx4_dev *dev, int slave,
3729                                 struct mlx4_qp_context *qpc,
3730                                 struct mlx4_cmd_mailbox *inbox)
3731 {
3732         u64 mac;
3733         int port;
3734         u32 ts = (be32_to_cpu(qpc->flags) >> 16) & 0xff;
3735         u8 sched = *(u8 *)(inbox->buf + 64);
3736         u8 smac_ix;
3737
3738         port = (sched >> 6 & 1) + 1;
3739         if (mlx4_is_eth(dev, port) && (ts != MLX4_QP_ST_MLX)) {
3740                 smac_ix = qpc->pri_path.grh_mylmc & 0x7f;
3741                 if (mac_find_smac_ix_in_slave(dev, slave, port, smac_ix, &mac))
3742                         return -ENOENT;
3743         }
3744         return 0;
3745 }
3746
3747 int mlx4_INIT2RTR_QP_wrapper(struct mlx4_dev *dev, int slave,
3748                              struct mlx4_vhcr *vhcr,
3749                              struct mlx4_cmd_mailbox *inbox,
3750                              struct mlx4_cmd_mailbox *outbox,
3751                              struct mlx4_cmd_info *cmd)
3752 {
3753         int err;
3754         struct mlx4_qp_context *qpc = inbox->buf + 8;
3755         int qpn = vhcr->in_modifier & 0x7fffff;
3756         struct res_qp *qp;
3757         u8 orig_sched_queue;
3758         __be32  orig_param3 = qpc->param3;
3759         u8 orig_vlan_control = qpc->pri_path.vlan_control;
3760         u8 orig_fvl_rx = qpc->pri_path.fvl_rx;
3761         u8 orig_pri_path_fl = qpc->pri_path.fl;
3762         u8 orig_vlan_index = qpc->pri_path.vlan_index;
3763         u8 orig_feup = qpc->pri_path.feup;
3764
3765         err = adjust_qp_sched_queue(dev, slave, qpc, inbox);
3766         if (err)
3767                 return err;
3768         err = verify_qp_parameters(dev, vhcr, inbox, QP_TRANS_INIT2RTR, slave);
3769         if (err)
3770                 return err;
3771
3772         if (roce_verify_mac(dev, slave, qpc, inbox))
3773                 return -EINVAL;
3774
3775         update_pkey_index(dev, slave, inbox);
3776         update_gid(dev, inbox, (u8)slave);
3777         adjust_proxy_tun_qkey(dev, vhcr, qpc);
3778         orig_sched_queue = qpc->pri_path.sched_queue;
3779
3780         err = get_res(dev, slave, qpn, RES_QP, &qp);
3781         if (err)
3782                 return err;
3783         if (qp->com.from_state != RES_QP_HW) {
3784                 err = -EBUSY;
3785                 goto out;
3786         }
3787
3788         err = update_vport_qp_param(dev, inbox, slave, qpn);
3789         if (err)
3790                 goto out;
3791
3792         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3793 out:
3794         /* if no error, save sched queue value passed in by VF. This is
3795          * essentially the QOS value provided by the VF. This will be useful
3796          * if we allow dynamic changes from VST back to VGT
3797          */
3798         if (!err) {
3799                 qp->sched_queue = orig_sched_queue;
3800                 qp->param3      = orig_param3;
3801                 qp->vlan_control = orig_vlan_control;
3802                 qp->fvl_rx      =  orig_fvl_rx;
3803                 qp->pri_path_fl = orig_pri_path_fl;
3804                 qp->vlan_index  = orig_vlan_index;
3805                 qp->feup        = orig_feup;
3806         }
3807         put_res(dev, slave, qpn, RES_QP);
3808         return err;
3809 }
3810
3811 int mlx4_RTR2RTS_QP_wrapper(struct mlx4_dev *dev, int slave,
3812                             struct mlx4_vhcr *vhcr,
3813                             struct mlx4_cmd_mailbox *inbox,
3814                             struct mlx4_cmd_mailbox *outbox,
3815                             struct mlx4_cmd_info *cmd)
3816 {
3817         int err;
3818         struct mlx4_qp_context *context = inbox->buf + 8;
3819
3820         err = adjust_qp_sched_queue(dev, slave, context, inbox);
3821         if (err)
3822                 return err;
3823         err = verify_qp_parameters(dev, vhcr, inbox, QP_TRANS_RTR2RTS, slave);
3824         if (err)
3825                 return err;
3826
3827         update_pkey_index(dev, slave, inbox);
3828         update_gid(dev, inbox, (u8)slave);
3829         adjust_proxy_tun_qkey(dev, vhcr, context);
3830         return mlx4_GEN_QP_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3831 }
3832
3833 int mlx4_RTS2RTS_QP_wrapper(struct mlx4_dev *dev, int slave,
3834                             struct mlx4_vhcr *vhcr,
3835                             struct mlx4_cmd_mailbox *inbox,
3836                             struct mlx4_cmd_mailbox *outbox,
3837                             struct mlx4_cmd_info *cmd)
3838 {
3839         int err;
3840         struct mlx4_qp_context *context = inbox->buf + 8;
3841
3842         err = adjust_qp_sched_queue(dev, slave, context, inbox);
3843         if (err)
3844                 return err;
3845         err = verify_qp_parameters(dev, vhcr, inbox, QP_TRANS_RTS2RTS, slave);
3846         if (err)
3847                 return err;
3848
3849         update_pkey_index(dev, slave, inbox);
3850         update_gid(dev, inbox, (u8)slave);
3851         adjust_proxy_tun_qkey(dev, vhcr, context);
3852         return mlx4_GEN_QP_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3853 }
3854
3855
3856 int mlx4_SQERR2RTS_QP_wrapper(struct mlx4_dev *dev, int slave,
3857                               struct mlx4_vhcr *vhcr,
3858                               struct mlx4_cmd_mailbox *inbox,
3859                               struct mlx4_cmd_mailbox *outbox,
3860                               struct mlx4_cmd_info *cmd)
3861 {
3862         struct mlx4_qp_context *context = inbox->buf + 8;
3863         int err = adjust_qp_sched_queue(dev, slave, context, inbox);
3864         if (err)
3865                 return err;
3866         adjust_proxy_tun_qkey(dev, vhcr, context);
3867         return mlx4_GEN_QP_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3868 }
3869
3870 int mlx4_SQD2SQD_QP_wrapper(struct mlx4_dev *dev, int slave,
3871                             struct mlx4_vhcr *vhcr,
3872                             struct mlx4_cmd_mailbox *inbox,
3873                             struct mlx4_cmd_mailbox *outbox,
3874                             struct mlx4_cmd_info *cmd)
3875 {
3876         int err;
3877         struct mlx4_qp_context *context = inbox->buf + 8;
3878
3879         err = adjust_qp_sched_queue(dev, slave, context, inbox);
3880         if (err)
3881                 return err;
3882         err = verify_qp_parameters(dev, vhcr, inbox, QP_TRANS_SQD2SQD, slave);
3883         if (err)
3884                 return err;
3885
3886         adjust_proxy_tun_qkey(dev, vhcr, context);
3887         update_gid(dev, inbox, (u8)slave);
3888         update_pkey_index(dev, slave, inbox);
3889         return mlx4_GEN_QP_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3890 }
3891
3892 int mlx4_SQD2RTS_QP_wrapper(struct mlx4_dev *dev, int slave,
3893                             struct mlx4_vhcr *vhcr,
3894                             struct mlx4_cmd_mailbox *inbox,
3895                             struct mlx4_cmd_mailbox *outbox,
3896                             struct mlx4_cmd_info *cmd)
3897 {
3898         int err;
3899         struct mlx4_qp_context *context = inbox->buf + 8;
3900
3901         err = adjust_qp_sched_queue(dev, slave, context, inbox);
3902         if (err)
3903                 return err;
3904         err = verify_qp_parameters(dev, vhcr, inbox, QP_TRANS_SQD2RTS, slave);
3905         if (err)
3906                 return err;
3907
3908         adjust_proxy_tun_qkey(dev, vhcr, context);
3909         update_gid(dev, inbox, (u8)slave);
3910         update_pkey_index(dev, slave, inbox);
3911         return mlx4_GEN_QP_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3912 }
3913
3914 int mlx4_2RST_QP_wrapper(struct mlx4_dev *dev, int slave,
3915                          struct mlx4_vhcr *vhcr,
3916                          struct mlx4_cmd_mailbox *inbox,
3917                          struct mlx4_cmd_mailbox *outbox,
3918                          struct mlx4_cmd_info *cmd)
3919 {
3920         int err;
3921         int qpn = vhcr->in_modifier & 0x7fffff;
3922         struct res_qp *qp;
3923
3924         err = qp_res_start_move_to(dev, slave, qpn, RES_QP_MAPPED, &qp, 0);
3925         if (err)
3926                 return err;
3927         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
3928         if (err)
3929                 goto ex_abort;
3930
3931         atomic_dec(&qp->mtt->ref_count);
3932         atomic_dec(&qp->rcq->ref_count);
3933         atomic_dec(&qp->scq->ref_count);
3934         if (qp->srq)
3935                 atomic_dec(&qp->srq->ref_count);
3936         res_end_move(dev, slave, RES_QP, qpn);
3937         return 0;
3938
3939 ex_abort:
3940         res_abort_move(dev, slave, RES_QP, qpn);
3941
3942         return err;
3943 }
3944
3945 static struct res_gid *find_gid(struct mlx4_dev *dev, int slave,
3946                                 struct res_qp *rqp, u8 *gid)
3947 {
3948         struct res_gid *res;
3949
3950         list_for_each_entry(res, &rqp->mcg_list, list) {
3951                 if (!memcmp(res->gid, gid, 16))
3952                         return res;
3953         }
3954         return NULL;
3955 }
3956
3957 static int add_mcg_res(struct mlx4_dev *dev, int slave, struct res_qp *rqp,
3958                        u8 *gid, enum mlx4_protocol prot,
3959                        enum mlx4_steer_type steer, u64 reg_id)
3960 {
3961         struct res_gid *res;
3962         int err;
3963
3964         res = kzalloc(sizeof *res, GFP_KERNEL);
3965         if (!res)
3966                 return -ENOMEM;
3967
3968         spin_lock_irq(&rqp->mcg_spl);
3969         if (find_gid(dev, slave, rqp, gid)) {
3970                 kfree(res);
3971                 err = -EEXIST;
3972         } else {
3973                 memcpy(res->gid, gid, 16);
3974                 res->prot = prot;
3975                 res->steer = steer;
3976                 res->reg_id = reg_id;
3977                 list_add_tail(&res->list, &rqp->mcg_list);
3978                 err = 0;
3979         }
3980         spin_unlock_irq(&rqp->mcg_spl);
3981
3982         return err;
3983 }
3984
3985 static int rem_mcg_res(struct mlx4_dev *dev, int slave, struct res_qp *rqp,
3986                        u8 *gid, enum mlx4_protocol prot,
3987                        enum mlx4_steer_type steer, u64 *reg_id)
3988 {
3989         struct res_gid *res;
3990         int err;
3991
3992         spin_lock_irq(&rqp->mcg_spl);
3993         res = find_gid(dev, slave, rqp, gid);
3994         if (!res || res->prot != prot || res->steer != steer)
3995                 err = -EINVAL;
3996         else {
3997                 *reg_id = res->reg_id;
3998                 list_del(&res->list);
3999                 kfree(res);
4000                 err = 0;
4001         }
4002         spin_unlock_irq(&rqp->mcg_spl);
4003
4004         return err;
4005 }
4006
4007 static int qp_attach(struct mlx4_dev *dev, int slave, struct mlx4_qp *qp,
4008                      u8 gid[16], int block_loopback, enum mlx4_protocol prot,
4009                      enum mlx4_steer_type type, u64 *reg_id)
4010 {
4011         switch (dev->caps.steering_mode) {
4012         case MLX4_STEERING_MODE_DEVICE_MANAGED: {
4013                 int port = mlx4_slave_convert_port(dev, slave, gid[5]);
4014                 if (port < 0)
4015                         return port;
4016                 return mlx4_trans_to_dmfs_attach(dev, qp, gid, port,
4017                                                 block_loopback, prot,
4018                                                 reg_id);
4019         }
4020         case MLX4_STEERING_MODE_B0:
4021                 if (prot == MLX4_PROT_ETH) {
4022                         int port = mlx4_slave_convert_port(dev, slave, gid[5]);
4023                         if (port < 0)
4024                                 return port;
4025                         gid[5] = port;
4026                 }
4027                 return mlx4_qp_attach_common(dev, qp, gid,
4028                                             block_loopback, prot, type);
4029         default:
4030                 return -EINVAL;
4031         }
4032 }
4033
4034 static int qp_detach(struct mlx4_dev *dev, struct mlx4_qp *qp,
4035                      u8 gid[16], enum mlx4_protocol prot,
4036                      enum mlx4_steer_type type, u64 reg_id)
4037 {
4038         switch (dev->caps.steering_mode) {
4039         case MLX4_STEERING_MODE_DEVICE_MANAGED:
4040                 return mlx4_flow_detach(dev, reg_id);
4041         case MLX4_STEERING_MODE_B0:
4042                 return mlx4_qp_detach_common(dev, qp, gid, prot, type);
4043         default:
4044                 return -EINVAL;
4045         }
4046 }
4047
4048 static int mlx4_adjust_port(struct mlx4_dev *dev, int slave,
4049                             u8 *gid, enum mlx4_protocol prot)
4050 {
4051         int real_port;
4052
4053         if (prot != MLX4_PROT_ETH)
4054                 return 0;
4055
4056         if (dev->caps.steering_mode == MLX4_STEERING_MODE_B0 ||
4057             dev->caps.steering_mode == MLX4_STEERING_MODE_DEVICE_MANAGED) {
4058                 real_port = mlx4_slave_convert_port(dev, slave, gid[5]);
4059                 if (real_port < 0)
4060                         return -EINVAL;
4061                 gid[5] = real_port;
4062         }
4063
4064         return 0;
4065 }
4066
4067 int mlx4_QP_ATTACH_wrapper(struct mlx4_dev *dev, int slave,
4068                                struct mlx4_vhcr *vhcr,
4069                                struct mlx4_cmd_mailbox *inbox,
4070                                struct mlx4_cmd_mailbox *outbox,
4071                                struct mlx4_cmd_info *cmd)
4072 {
4073         struct mlx4_qp qp; /* dummy for calling attach/detach */
4074         u8 *gid = inbox->buf;
4075         enum mlx4_protocol prot = (vhcr->in_modifier >> 28) & 0x7;
4076         int err;
4077         int qpn;
4078         struct res_qp *rqp;
4079         u64 reg_id = 0;
4080         int attach = vhcr->op_modifier;
4081         int block_loopback = vhcr->in_modifier >> 31;
4082         u8 steer_type_mask = 2;
4083         enum mlx4_steer_type type = (gid[7] & steer_type_mask) >> 1;
4084
4085         qpn = vhcr->in_modifier & 0xffffff;
4086         err = get_res(dev, slave, qpn, RES_QP, &rqp);
4087         if (err)
4088                 return err;
4089
4090         qp.qpn = qpn;
4091         if (attach) {
4092                 err = qp_attach(dev, slave, &qp, gid, block_loopback, prot,
4093                                 type, &reg_id);
4094                 if (err) {
4095                         pr_err("Fail to attach rule to qp 0x%x\n", qpn);
4096                         goto ex_put;
4097                 }
4098                 err = add_mcg_res(dev, slave, rqp, gid, prot, type, reg_id);
4099                 if (err)
4100                         goto ex_detach;
4101         } else {
4102                 err = mlx4_adjust_port(dev, slave, gid, prot);
4103                 if (err)
4104                         goto ex_put;
4105
4106                 err = rem_mcg_res(dev, slave, rqp, gid, prot, type, &reg_id);
4107                 if (err)
4108                         goto ex_put;
4109
4110                 err = qp_detach(dev, &qp, gid, prot, type, reg_id);
4111                 if (err)
4112                         pr_err("Fail to detach rule from qp 0x%x reg_id = 0x%llx\n",
4113                                qpn, reg_id);
4114         }
4115         put_res(dev, slave, qpn, RES_QP);
4116         return err;
4117
4118 ex_detach:
4119         qp_detach(dev, &qp, gid, prot, type, reg_id);
4120 ex_put:
4121         put_res(dev, slave, qpn, RES_QP);
4122         return err;
4123 }
4124
4125 /*
4126  * MAC validation for Flow Steering rules.
4127  * VF can attach rules only with a mac address which is assigned to it.
4128  */
4129 static int validate_eth_header_mac(int slave, struct _rule_hw *eth_header,
4130                                    struct list_head *rlist)
4131 {
4132         struct mac_res *res, *tmp;
4133         __be64 be_mac;
4134
4135         /* make sure it isn't multicast or broadcast mac*/
4136         if (!is_multicast_ether_addr(eth_header->eth.dst_mac) &&
4137             !is_broadcast_ether_addr(eth_header->eth.dst_mac)) {
4138                 list_for_each_entry_safe(res, tmp, rlist, list) {
4139                         be_mac = cpu_to_be64(res->mac << 16);
4140                         if (ether_addr_equal((u8 *)&be_mac, eth_header->eth.dst_mac))
4141                                 return 0;
4142                 }
4143                 pr_err("MAC %pM doesn't belong to VF %d, Steering rule rejected\n",
4144                        eth_header->eth.dst_mac, slave);
4145                 return -EINVAL;
4146         }
4147         return 0;
4148 }
4149
4150 static void handle_eth_header_mcast_prio(struct mlx4_net_trans_rule_hw_ctrl *ctrl,
4151                                          struct _rule_hw *eth_header)
4152 {
4153         if (is_multicast_ether_addr(eth_header->eth.dst_mac) ||
4154             is_broadcast_ether_addr(eth_header->eth.dst_mac)) {
4155                 struct mlx4_net_trans_rule_hw_eth *eth =
4156                         (struct mlx4_net_trans_rule_hw_eth *)eth_header;
4157                 struct _rule_hw *next_rule = (struct _rule_hw *)(eth + 1);
4158                 bool last_rule = next_rule->size == 0 && next_rule->id == 0 &&
4159                         next_rule->rsvd == 0;
4160
4161                 if (last_rule)
4162                         ctrl->prio = cpu_to_be16(MLX4_DOMAIN_NIC);
4163         }
4164 }
4165
4166 /*
4167  * In case of missing eth header, append eth header with a MAC address
4168  * assigned to the VF.
4169  */
4170 static int add_eth_header(struct mlx4_dev *dev, int slave,
4171                           struct mlx4_cmd_mailbox *inbox,
4172                           struct list_head *rlist, int header_id)
4173 {
4174         struct mac_res *res, *tmp;
4175         u8 port;
4176         struct mlx4_net_trans_rule_hw_ctrl *ctrl;
4177         struct mlx4_net_trans_rule_hw_eth *eth_header;
4178         struct mlx4_net_trans_rule_hw_ipv4 *ip_header;
4179         struct mlx4_net_trans_rule_hw_tcp_udp *l4_header;
4180         __be64 be_mac = 0;
4181         __be64 mac_msk = cpu_to_be64(MLX4_MAC_MASK << 16);
4182
4183         ctrl = (struct mlx4_net_trans_rule_hw_ctrl *)inbox->buf;
4184         port = ctrl->port;
4185         eth_header = (struct mlx4_net_trans_rule_hw_eth *)(ctrl + 1);
4186
4187         /* Clear a space in the inbox for eth header */
4188         switch (header_id) {
4189         case MLX4_NET_TRANS_RULE_ID_IPV4:
4190                 ip_header =
4191                         (struct mlx4_net_trans_rule_hw_ipv4 *)(eth_header + 1);
4192                 memmove(ip_header, eth_header,
4193                         sizeof(*ip_header) + sizeof(*l4_header));
4194                 break;
4195         case MLX4_NET_TRANS_RULE_ID_TCP:
4196         case MLX4_NET_TRANS_RULE_ID_UDP:
4197                 l4_header = (struct mlx4_net_trans_rule_hw_tcp_udp *)
4198                             (eth_header + 1);
4199                 memmove(l4_header, eth_header, sizeof(*l4_header));
4200                 break;
4201         default:
4202                 return -EINVAL;
4203         }
4204         list_for_each_entry_safe(res, tmp, rlist, list) {
4205                 if (port == res->port) {
4206                         be_mac = cpu_to_be64(res->mac << 16);
4207                         break;
4208                 }
4209         }
4210         if (!be_mac) {
4211                 pr_err("Failed adding eth header to FS rule, Can't find matching MAC for port %d\n",
4212                        port);
4213                 return -EINVAL;
4214         }
4215
4216         memset(eth_header, 0, sizeof(*eth_header));
4217         eth_header->size = sizeof(*eth_header) >> 2;
4218         eth_header->id = cpu_to_be16(__sw_id_hw[MLX4_NET_TRANS_RULE_ID_ETH]);
4219         memcpy(eth_header->dst_mac, &be_mac, ETH_ALEN);
4220         memcpy(eth_header->dst_mac_msk, &mac_msk, ETH_ALEN);
4221
4222         return 0;
4223
4224 }
4225
/*
 * Primary address-path mask bits that mlx4_UPDATE_QP_wrapper() accepts
 * from a slave; any other bit set in the mask makes the wrapper return
 * -EPERM.
 */
#define MLX4_UPD_QP_PATH_MASK_SUPPORTED      (                                \
        1ULL << MLX4_UPD_QP_PATH_MASK_MAC_INDEX                     |\
        1ULL << MLX4_UPD_QP_PATH_MASK_ETH_SRC_CHECK_MC_LB)
4229 int mlx4_UPDATE_QP_wrapper(struct mlx4_dev *dev, int slave,
4230                            struct mlx4_vhcr *vhcr,
4231                            struct mlx4_cmd_mailbox *inbox,
4232                            struct mlx4_cmd_mailbox *outbox,
4233                            struct mlx4_cmd_info *cmd_info)
4234 {
4235         int err;
4236         u32 qpn = vhcr->in_modifier & 0xffffff;
4237         struct res_qp *rqp;
4238         u64 mac;
4239         unsigned port;
4240         u64 pri_addr_path_mask;
4241         struct mlx4_update_qp_context *cmd;
4242         int smac_index;
4243
4244         cmd = (struct mlx4_update_qp_context *)inbox->buf;
4245
4246         pri_addr_path_mask = be64_to_cpu(cmd->primary_addr_path_mask);
4247         if (cmd->qp_mask || cmd->secondary_addr_path_mask ||
4248             (pri_addr_path_mask & ~MLX4_UPD_QP_PATH_MASK_SUPPORTED))
4249                 return -EPERM;
4250
4251         if ((pri_addr_path_mask &
4252              (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_SRC_CHECK_MC_LB)) &&
4253                 !(dev->caps.flags2 &
4254                   MLX4_DEV_CAP_FLAG2_UPDATE_QP_SRC_CHECK_LB)) {
4255                         mlx4_warn(dev,
4256                                   "Src check LB for slave %d isn't supported\n",
4257                                    slave);
4258                 return -ENOTSUPP;
4259         }
4260
4261         /* Just change the smac for the QP */
4262         err = get_res(dev, slave, qpn, RES_QP, &rqp);
4263         if (err) {
4264                 mlx4_err(dev, "Updating qpn 0x%x for slave %d rejected\n", qpn, slave);
4265                 return err;
4266         }
4267
4268         port = (rqp->sched_queue >> 6 & 1) + 1;
4269
4270         if (pri_addr_path_mask & (1ULL << MLX4_UPD_QP_PATH_MASK_MAC_INDEX)) {
4271                 smac_index = cmd->qp_context.pri_path.grh_mylmc;
4272                 err = mac_find_smac_ix_in_slave(dev, slave, port,
4273                                                 smac_index, &mac);
4274
4275                 if (err) {
4276                         mlx4_err(dev, "Failed to update qpn 0x%x, MAC is invalid. smac_ix: %d\n",
4277                                  qpn, smac_index);
4278                         goto err_mac;
4279                 }
4280         }
4281
4282         err = mlx4_cmd(dev, inbox->dma,
4283                        vhcr->in_modifier, 0,
4284                        MLX4_CMD_UPDATE_QP, MLX4_CMD_TIME_CLASS_A,
4285                        MLX4_CMD_NATIVE);
4286         if (err) {
4287                 mlx4_err(dev, "Failed to update qpn on qpn 0x%x, command failed\n", qpn);
4288                 goto err_mac;
4289         }
4290
4291 err_mac:
4292         put_res(dev, slave, qpn, RES_QP);
4293         return err;
4294 }
4295
4296 static u32 qp_attach_mbox_size(void *mbox)
4297 {
4298         u32 size = sizeof(struct mlx4_net_trans_rule_hw_ctrl);
4299         struct _rule_hw  *rule_header;
4300
4301         rule_header = (struct _rule_hw *)(mbox + size);
4302
4303         while (rule_header->size) {
4304                 size += rule_header->size * sizeof(u32);
4305                 rule_header += 1;
4306         }
4307         return size;
4308 }
4309
/* Defined later in this file; needed by the flow-steering attach wrapper. */
static int mlx4_do_mirror_rule(struct mlx4_dev *dev, struct res_fs_rule *fs_rule);
4311
4312 int mlx4_QP_FLOW_STEERING_ATTACH_wrapper(struct mlx4_dev *dev, int slave,
4313                                          struct mlx4_vhcr *vhcr,
4314                                          struct mlx4_cmd_mailbox *inbox,
4315                                          struct mlx4_cmd_mailbox *outbox,
4316                                          struct mlx4_cmd_info *cmd)
4317 {
4318
4319         struct mlx4_priv *priv = mlx4_priv(dev);
4320         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
4321         struct list_head *rlist = &tracker->slave_list[slave].res_list[RES_MAC];
4322         int err;
4323         int qpn;
4324         struct res_qp *rqp;
4325         struct mlx4_net_trans_rule_hw_ctrl *ctrl;
4326         struct _rule_hw  *rule_header;
4327         int header_id;
4328         struct res_fs_rule *rrule;
4329         u32 mbox_size;
4330
4331         if (dev->caps.steering_mode !=
4332             MLX4_STEERING_MODE_DEVICE_MANAGED)
4333                 return -EOPNOTSUPP;
4334
4335         ctrl = (struct mlx4_net_trans_rule_hw_ctrl *)inbox->buf;
4336         err = mlx4_slave_convert_port(dev, slave, ctrl->port);
4337         if (err <= 0)
4338                 return -EINVAL;
4339         ctrl->port = err;
4340         qpn = be32_to_cpu(ctrl->qpn) & 0xffffff;
4341         err = get_res(dev, slave, qpn, RES_QP, &rqp);
4342         if (err) {
4343                 pr_err("Steering rule with qpn 0x%x rejected\n", qpn);
4344                 return err;
4345         }
4346         rule_header = (struct _rule_hw *)(ctrl + 1);
4347         header_id = map_hw_to_sw_id(be16_to_cpu(rule_header->id));
4348
4349         if (header_id == MLX4_NET_TRANS_RULE_ID_ETH)
4350                 handle_eth_header_mcast_prio(ctrl, rule_header);
4351
4352         if (slave == dev->caps.function)
4353                 goto execute;
4354
4355         switch (header_id) {
4356         case MLX4_NET_TRANS_RULE_ID_ETH:
4357                 if (validate_eth_header_mac(slave, rule_header, rlist)) {
4358                         err = -EINVAL;
4359                         goto err_put_qp;
4360                 }
4361                 break;
4362         case MLX4_NET_TRANS_RULE_ID_IB:
4363                 break;
4364         case MLX4_NET_TRANS_RULE_ID_IPV4:
4365         case MLX4_NET_TRANS_RULE_ID_TCP:
4366         case MLX4_NET_TRANS_RULE_ID_UDP:
4367                 pr_warn("Can't attach FS rule without L2 headers, adding L2 header\n");
4368                 if (add_eth_header(dev, slave, inbox, rlist, header_id)) {
4369                         err = -EINVAL;
4370                         goto err_put_qp;
4371                 }
4372                 vhcr->in_modifier +=
4373                         sizeof(struct mlx4_net_trans_rule_hw_eth) >> 2;
4374                 break;
4375         default:
4376                 pr_err("Corrupted mailbox\n");
4377                 err = -EINVAL;
4378                 goto err_put_qp;
4379         }
4380
4381 execute:
4382         err = mlx4_cmd_imm(dev, inbox->dma, &vhcr->out_param,
4383                            vhcr->in_modifier, 0,
4384                            MLX4_QP_FLOW_STEERING_ATTACH, MLX4_CMD_TIME_CLASS_A,
4385                            MLX4_CMD_NATIVE);
4386         if (err)
4387                 goto err_put_qp;
4388
4389
4390         err = add_res_range(dev, slave, vhcr->out_param, 1, RES_FS_RULE, qpn);
4391         if (err) {
4392                 mlx4_err(dev, "Fail to add flow steering resources\n");
4393                 goto err_detach;
4394         }
4395
4396         err = get_res(dev, slave, vhcr->out_param, RES_FS_RULE, &rrule);
4397         if (err)
4398                 goto err_detach;
4399
4400         mbox_size = qp_attach_mbox_size(inbox->buf);
4401         rrule->mirr_mbox = kmalloc(mbox_size, GFP_KERNEL);
4402         if (!rrule->mirr_mbox) {
4403                 err = -ENOMEM;
4404                 goto err_put_rule;
4405         }
4406         rrule->mirr_mbox_size = mbox_size;
4407         rrule->mirr_rule_id = 0;
4408         memcpy(rrule->mirr_mbox, inbox->buf, mbox_size);
4409
4410         /* set different port */
4411         ctrl = (struct mlx4_net_trans_rule_hw_ctrl *)rrule->mirr_mbox;
4412         if (ctrl->port == 1)
4413                 ctrl->port = 2;
4414         else
4415                 ctrl->port = 1;
4416
4417         if (mlx4_is_bonded(dev))
4418                 mlx4_do_mirror_rule(dev, rrule);
4419
4420         atomic_inc(&rqp->ref_count);
4421
4422 err_put_rule:
4423         put_res(dev, slave, vhcr->out_param, RES_FS_RULE);
4424 err_detach:
4425         /* detach rule on error */
4426         if (err)
4427                 mlx4_cmd(dev, vhcr->out_param, 0, 0,
4428                          MLX4_QP_FLOW_STEERING_DETACH, MLX4_CMD_TIME_CLASS_A,
4429                          MLX4_CMD_NATIVE);
4430 err_put_qp:
4431         put_res(dev, slave, qpn, RES_QP);
4432         return err;
4433 }
4434
4435 static int mlx4_undo_mirror_rule(struct mlx4_dev *dev, struct res_fs_rule *fs_rule)
4436 {
4437         int err;
4438
4439         err = rem_res_range(dev, fs_rule->com.owner, fs_rule->com.res_id, 1, RES_FS_RULE, 0);
4440         if (err) {
4441                 mlx4_err(dev, "Fail to remove flow steering resources\n");
4442                 return err;
4443         }
4444
4445         mlx4_cmd(dev, fs_rule->com.res_id, 0, 0, MLX4_QP_FLOW_STEERING_DETACH,
4446                  MLX4_CMD_TIME_CLASS_A, MLX4_CMD_NATIVE);
4447         return 0;
4448 }
4449
4450 int mlx4_QP_FLOW_STEERING_DETACH_wrapper(struct mlx4_dev *dev, int slave,
4451                                          struct mlx4_vhcr *vhcr,
4452                                          struct mlx4_cmd_mailbox *inbox,
4453                                          struct mlx4_cmd_mailbox *outbox,
4454                                          struct mlx4_cmd_info *cmd)
4455 {
4456         int err;
4457         struct res_qp *rqp;
4458         struct res_fs_rule *rrule;
4459         u64 mirr_reg_id;
4460
4461         if (dev->caps.steering_mode !=
4462             MLX4_STEERING_MODE_DEVICE_MANAGED)
4463                 return -EOPNOTSUPP;
4464
4465         err = get_res(dev, slave, vhcr->in_param, RES_FS_RULE, &rrule);
4466         if (err)
4467                 return err;
4468
4469         if (!rrule->mirr_mbox) {
4470                 mlx4_err(dev, "Mirror rules cannot be removed explicitly\n");
4471                 put_res(dev, slave, vhcr->in_param, RES_FS_RULE);
4472                 return -EINVAL;
4473         }
4474         mirr_reg_id = rrule->mirr_rule_id;
4475         kfree(rrule->mirr_mbox);
4476
4477         /* Release the rule form busy state before removal */
4478         put_res(dev, slave, vhcr->in_param, RES_FS_RULE);
4479         err = get_res(dev, slave, rrule->qpn, RES_QP, &rqp);
4480         if (err)
4481                 return err;
4482
4483         if (mirr_reg_id && mlx4_is_bonded(dev)) {
4484                 err = get_res(dev, slave, mirr_reg_id, RES_FS_RULE, &rrule);
4485                 if (err) {
4486                         mlx4_err(dev, "Fail to get resource of mirror rule\n");
4487                 } else {
4488                         put_res(dev, slave, mirr_reg_id, RES_FS_RULE);
4489                         mlx4_undo_mirror_rule(dev, rrule);
4490                 }
4491         }
4492         err = rem_res_range(dev, slave, vhcr->in_param, 1, RES_FS_RULE, 0);
4493         if (err) {
4494                 mlx4_err(dev, "Fail to remove flow steering resources\n");
4495                 goto out;
4496         }
4497
4498         err = mlx4_cmd(dev, vhcr->in_param, 0, 0,
4499                        MLX4_QP_FLOW_STEERING_DETACH, MLX4_CMD_TIME_CLASS_A,
4500                        MLX4_CMD_NATIVE);
4501         if (!err)
4502                 atomic_dec(&rqp->ref_count);
4503 out:
4504         put_res(dev, slave, rrule->qpn, RES_QP);
4505         return err;
4506 }
4507
/*
 * Retry limit constant.
 * NOTE(review): not referenced in the portion of the file reviewed here;
 * confirm it still has users.
 */
enum {
        BUSY_MAX_RETRIES = 10
};
4511
4512 int mlx4_QUERY_IF_STAT_wrapper(struct mlx4_dev *dev, int slave,
4513                                struct mlx4_vhcr *vhcr,
4514                                struct mlx4_cmd_mailbox *inbox,
4515                                struct mlx4_cmd_mailbox *outbox,
4516                                struct mlx4_cmd_info *cmd)
4517 {
4518         int err;
4519         int index = vhcr->in_modifier & 0xffff;
4520
4521         err = get_res(dev, slave, index, RES_COUNTER, NULL);
4522         if (err)
4523                 return err;
4524
4525         err = mlx4_DMA_wrapper(dev, slave, vhcr, inbox, outbox, cmd);
4526         put_res(dev, slave, index, RES_COUNTER);
4527         return err;
4528 }
4529
4530 static void detach_qp(struct mlx4_dev *dev, int slave, struct res_qp *rqp)
4531 {
4532         struct res_gid *rgid;
4533         struct res_gid *tmp;
4534         struct mlx4_qp qp; /* dummy for calling attach/detach */
4535
4536         list_for_each_entry_safe(rgid, tmp, &rqp->mcg_list, list) {
4537                 switch (dev->caps.steering_mode) {
4538                 case MLX4_STEERING_MODE_DEVICE_MANAGED:
4539                         mlx4_flow_detach(dev, rgid->reg_id);
4540                         break;
4541                 case MLX4_STEERING_MODE_B0:
4542                         qp.qpn = rqp->local_qpn;
4543                         (void) mlx4_qp_detach_common(dev, &qp, rgid->gid,
4544                                                      rgid->prot, rgid->steer);
4545                         break;
4546                 }
4547                 list_del(&rgid->list);
4548                 kfree(rgid);
4549         }
4550 }
4551
4552 static int _move_all_busy(struct mlx4_dev *dev, int slave,
4553                           enum mlx4_resource type, int print)
4554 {
4555         struct mlx4_priv *priv = mlx4_priv(dev);
4556         struct mlx4_resource_tracker *tracker =
4557                 &priv->mfunc.master.res_tracker;
4558         struct list_head *rlist = &tracker->slave_list[slave].res_list[type];
4559         struct res_common *r;
4560         struct res_common *tmp;
4561         int busy;
4562
4563         busy = 0;
4564         spin_lock_irq(mlx4_tlock(dev));
4565         list_for_each_entry_safe(r, tmp, rlist, list) {
4566                 if (r->owner == slave) {
4567                         if (!r->removing) {
4568                                 if (r->state == RES_ANY_BUSY) {
4569                                         if (print)
4570                                                 mlx4_dbg(dev,
4571                                                          "%s id 0x%llx is busy\n",
4572                                                           resource_str(type),
4573                                                           r->res_id);
4574                                         ++busy;
4575                                 } else {
4576                                         r->from_state = r->state;
4577                                         r->state = RES_ANY_BUSY;
4578                                         r->removing = 1;
4579                                 }
4580                         }
4581                 }
4582         }
4583         spin_unlock_irq(mlx4_tlock(dev));
4584
4585         return busy;
4586 }
4587
4588 static int move_all_busy(struct mlx4_dev *dev, int slave,
4589                          enum mlx4_resource type)
4590 {
4591         unsigned long begin;
4592         int busy;
4593
4594         begin = jiffies;
4595         do {
4596                 busy = _move_all_busy(dev, slave, type, 0);
4597                 if (time_after(jiffies, begin + 5 * HZ))
4598                         break;
4599                 if (busy)
4600                         cond_resched();
4601         } while (busy);
4602
4603         if (busy)
4604                 busy = _move_all_busy(dev, slave, type, 1);
4605
4606         return busy;
4607 }
/*
 * Release every QP resource still tracked for @slave.
 *
 * All of the slave's QPs are first claimed with move_all_busy(). Each QP
 * is then detached from its steering entries and walked down from the
 * state it was in when claimed (from_state):
 *   RES_QP_HW       -> moved to reset by the device, references on its
 *                      CQs/MTT/SRQ dropped, then treated as MAPPED
 *   RES_QP_MAPPED   -> ICM freed unless the qpn passes valid_reserved(),
 *                      then treated as RESERVED
 *   RES_QP_RESERVED -> removed from the tracker tree and list, qpn range
 *                      released unless valid_reserved(), entry freed
 *
 * The tracker lock is dropped while an entry is processed and retaken
 * before the list iteration advances.
 */
static void rem_slave_qps(struct mlx4_dev *dev, int slave)
{
        struct mlx4_priv *priv = mlx4_priv(dev);
        struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
        struct list_head *qp_list =
                &tracker->slave_list[slave].res_list[RES_QP];
        struct res_qp *qp;
        struct res_qp *tmp;
        int state;
        u64 in_param;
        int qpn;
        int err;

        err = move_all_busy(dev, slave, RES_QP);
        if (err)
                mlx4_warn(dev, "rem_slave_qps: Could not move all qps to busy for slave %d\n",
                          slave);

        spin_lock_irq(mlx4_tlock(dev));
        list_for_each_entry_safe(qp, tmp, qp_list, com.list) {
                /* per-entry work runs without the tracker lock held */
                spin_unlock_irq(mlx4_tlock(dev));
                if (qp->com.owner == slave) {
                        qpn = qp->com.res_id;
                        detach_qp(dev, slave, qp);
                        state = qp->com.from_state;
                        /* step the QP down one state at a time until freed */
                        while (state != 0) {
                                switch (state) {
                                case RES_QP_RESERVED:
                                        spin_lock_irq(mlx4_tlock(dev));
                                        rb_erase(&qp->com.node,
                                                 &tracker->res_tree[RES_QP]);
                                        list_del(&qp->com.list);
                                        spin_unlock_irq(mlx4_tlock(dev));
                                        if (!valid_reserved(dev, slave, qpn)) {
                                                __mlx4_qp_release_range(dev, qpn, 1);
                                                mlx4_release_resource(dev, slave,
                                                                      RES_QP, 1, 0);
                                        }
                                        kfree(qp);
                                        state = 0;
                                        break;
                                case RES_QP_MAPPED:
                                        if (!valid_reserved(dev, slave, qpn))
                                                __mlx4_qp_free_icm(dev, qpn);
                                        state = RES_QP_RESERVED;
                                        break;
                                case RES_QP_HW:
                                        in_param = slave;
                                        err = mlx4_cmd(dev, in_param,
                                                       qp->local_qpn, 2,
                                                       MLX4_CMD_2RST_QP,
                                                       MLX4_CMD_TIME_CLASS_A,
                                                       MLX4_CMD_NATIVE);
                                        /* a failed reset is only logged; teardown continues */
                                        if (err)
                                                mlx4_dbg(dev, "rem_slave_qps: failed to move slave %d qpn %d to reset\n",
                                                         slave, qp->local_qpn);
                                        atomic_dec(&qp->rcq->ref_count);
                                        atomic_dec(&qp->scq->ref_count);
                                        atomic_dec(&qp->mtt->ref_count);
                                        if (qp->srq)
                                                atomic_dec(&qp->srq->ref_count);
                                        state = RES_QP_MAPPED;
                                        break;
                                default:
                                        state = 0;
                                }
                        }
                }
                /* retake the lock before the iterator moves to the next entry */
                spin_lock_irq(mlx4_tlock(dev));
        }
        spin_unlock_irq(mlx4_tlock(dev));
}
4680
4681 static void rem_slave_srqs(struct mlx4_dev *dev, int slave)
4682 {
4683         struct mlx4_priv *priv = mlx4_priv(dev);
4684         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
4685         struct list_head *srq_list =
4686                 &tracker->slave_list[slave].res_list[RES_SRQ];
4687         struct res_srq *srq;
4688         struct res_srq *tmp;
4689         int state;
4690         u64 in_param;
4691         LIST_HEAD(tlist);
4692         int srqn;
4693         int err;
4694
4695         err = move_all_busy(dev, slave, RES_SRQ);
4696         if (err)
4697                 mlx4_warn(dev, "rem_slave_srqs: Could not move all srqs - too busy for slave %d\n",
4698                           slave);
4699
4700         spin_lock_irq(mlx4_tlock(dev));
4701         list_for_each_entry_safe(srq, tmp, srq_list, com.list) {
4702                 spin_unlock_irq(mlx4_tlock(dev));
4703                 if (srq->com.owner == slave) {
4704                         srqn = srq->com.res_id;
4705                         state = srq->com.from_state;
4706                         while (state != 0) {
4707                                 switch (state) {
4708                                 case RES_SRQ_ALLOCATED:
4709                                         __mlx4_srq_free_icm(dev, srqn);
4710                                         spin_lock_irq(mlx4_tlock(dev));
4711                                         rb_erase(&srq->com.node,
4712                                                  &tracker->res_tree[RES_SRQ]);
4713                                         list_del(&srq->com.list);
4714                                         spin_unlock_irq(mlx4_tlock(dev));
4715                                         mlx4_release_resource(dev, slave,
4716                                                               RES_SRQ, 1, 0);
4717                                         kfree(srq);
4718                                         state = 0;
4719                                         break;
4720
4721                                 case RES_SRQ_HW:
4722                                         in_param = slave;
4723                                         err = mlx4_cmd(dev, in_param, srqn, 1,
4724                                                        MLX4_CMD_HW2SW_SRQ,
4725                                                        MLX4_CMD_TIME_CLASS_A,
4726                                                        MLX4_CMD_NATIVE);
4727                                         if (err)
4728                                                 mlx4_dbg(dev, "rem_slave_srqs: failed to move slave %d srq %d to SW ownership\n",
4729                                                          slave, srqn);
4730
4731                                         atomic_dec(&srq->mtt->ref_count);
4732                                         if (srq->cq)
4733                                                 atomic_dec(&srq->cq->ref_count);
4734                                         state = RES_SRQ_ALLOCATED;
4735                                         break;
4736
4737                                 default:
4738                                         state = 0;
4739                                 }
4740                         }
4741                 }
4742                 spin_lock_irq(mlx4_tlock(dev));
4743         }
4744         spin_unlock_irq(mlx4_tlock(dev));
4745 }
4746
4747 static void rem_slave_cqs(struct mlx4_dev *dev, int slave)
4748 {
4749         struct mlx4_priv *priv = mlx4_priv(dev);
4750         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
4751         struct list_head *cq_list =
4752                 &tracker->slave_list[slave].res_list[RES_CQ];
4753         struct res_cq *cq;
4754         struct res_cq *tmp;
4755         int state;
4756         u64 in_param;
4757         LIST_HEAD(tlist);
4758         int cqn;
4759         int err;
4760
4761         err = move_all_busy(dev, slave, RES_CQ);
4762         if (err)
4763                 mlx4_warn(dev, "rem_slave_cqs: Could not move all cqs - too busy for slave %d\n",
4764                           slave);
4765
4766         spin_lock_irq(mlx4_tlock(dev));
4767         list_for_each_entry_safe(cq, tmp, cq_list, com.list) {
4768                 spin_unlock_irq(mlx4_tlock(dev));
4769                 if (cq->com.owner == slave && !atomic_read(&cq->ref_count)) {
4770                         cqn = cq->com.res_id;
4771                         state = cq->com.from_state;
4772                         while (state != 0) {
4773                                 switch (state) {
4774                                 case RES_CQ_ALLOCATED:
4775                                         __mlx4_cq_free_icm(dev, cqn);
4776                                         spin_lock_irq(mlx4_tlock(dev));
4777                                         rb_erase(&cq->com.node,
4778                                                  &tracker->res_tree[RES_CQ]);
4779                                         list_del(&cq->com.list);
4780                                         spin_unlock_irq(mlx4_tlock(dev));
4781                                         mlx4_release_resource(dev, slave,
4782                                                               RES_CQ, 1, 0);
4783                                         kfree(cq);
4784                                         state = 0;
4785                                         break;
4786
4787                                 case RES_CQ_HW:
4788                                         in_param = slave;
4789                                         err = mlx4_cmd(dev, in_param, cqn, 1,
4790                                                        MLX4_CMD_HW2SW_CQ,
4791                                                        MLX4_CMD_TIME_CLASS_A,
4792                                                        MLX4_CMD_NATIVE);
4793                                         if (err)
4794                                                 mlx4_dbg(dev, "rem_slave_cqs: failed to move slave %d cq %d to SW ownership\n",
4795                                                          slave, cqn);
4796                                         atomic_dec(&cq->mtt->ref_count);
4797                                         state = RES_CQ_ALLOCATED;
4798                                         break;
4799
4800                                 default:
4801                                         state = 0;
4802                                 }
4803                         }
4804                 }
4805                 spin_lock_irq(mlx4_tlock(dev));
4806         }
4807         spin_unlock_irq(mlx4_tlock(dev));
4808 }
4809
4810 static void rem_slave_mrs(struct mlx4_dev *dev, int slave)
4811 {
4812         struct mlx4_priv *priv = mlx4_priv(dev);
4813         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
4814         struct list_head *mpt_list =
4815                 &tracker->slave_list[slave].res_list[RES_MPT];
4816         struct res_mpt *mpt;
4817         struct res_mpt *tmp;
4818         int state;
4819         u64 in_param;
4820         LIST_HEAD(tlist);
4821         int mptn;
4822         int err;
4823
4824         err = move_all_busy(dev, slave, RES_MPT);
4825         if (err)
4826                 mlx4_warn(dev, "rem_slave_mrs: Could not move all mpts - too busy for slave %d\n",
4827                           slave);
4828
4829         spin_lock_irq(mlx4_tlock(dev));
4830         list_for_each_entry_safe(mpt, tmp, mpt_list, com.list) {
4831                 spin_unlock_irq(mlx4_tlock(dev));
4832                 if (mpt->com.owner == slave) {
4833                         mptn = mpt->com.res_id;
4834                         state = mpt->com.from_state;
4835                         while (state != 0) {
4836                                 switch (state) {
4837                                 case RES_MPT_RESERVED:
4838                                         __mlx4_mpt_release(dev, mpt->key);
4839                                         spin_lock_irq(mlx4_tlock(dev));
4840                                         rb_erase(&mpt->com.node,
4841                                                  &tracker->res_tree[RES_MPT]);
4842                                         list_del(&mpt->com.list);
4843                                         spin_unlock_irq(mlx4_tlock(dev));
4844                                         mlx4_release_resource(dev, slave,
4845                                                               RES_MPT, 1, 0);
4846                                         kfree(mpt);
4847                                         state = 0;
4848                                         break;
4849
4850                                 case RES_MPT_MAPPED:
4851                                         __mlx4_mpt_free_icm(dev, mpt->key);
4852                                         state = RES_MPT_RESERVED;
4853                                         break;
4854
4855                                 case RES_MPT_HW:
4856                                         in_param = slave;
4857                                         err = mlx4_cmd(dev, in_param, mptn, 0,
4858                                                      MLX4_CMD_HW2SW_MPT,
4859                                                      MLX4_CMD_TIME_CLASS_A,
4860                                                      MLX4_CMD_NATIVE);
4861                                         if (err)
4862                                                 mlx4_dbg(dev, "rem_slave_mrs: failed to move slave %d mpt %d to SW ownership\n",
4863                                                          slave, mptn);
4864                                         if (mpt->mtt)
4865                                                 atomic_dec(&mpt->mtt->ref_count);
4866                                         state = RES_MPT_MAPPED;
4867                                         break;
4868                                 default:
4869                                         state = 0;
4870                                 }
4871                         }
4872                 }
4873                 spin_lock_irq(mlx4_tlock(dev));
4874         }
4875         spin_unlock_irq(mlx4_tlock(dev));
4876 }
4877
4878 static void rem_slave_mtts(struct mlx4_dev *dev, int slave)
4879 {
4880         struct mlx4_priv *priv = mlx4_priv(dev);
4881         struct mlx4_resource_tracker *tracker =
4882                 &priv->mfunc.master.res_tracker;
4883         struct list_head *mtt_list =
4884                 &tracker->slave_list[slave].res_list[RES_MTT];
4885         struct res_mtt *mtt;
4886         struct res_mtt *tmp;
4887         int state;
4888         LIST_HEAD(tlist);
4889         int base;
4890         int err;
4891
4892         err = move_all_busy(dev, slave, RES_MTT);
4893         if (err)
4894                 mlx4_warn(dev, "rem_slave_mtts: Could not move all mtts  - too busy for slave %d\n",
4895                           slave);
4896
4897         spin_lock_irq(mlx4_tlock(dev));
4898         list_for_each_entry_safe(mtt, tmp, mtt_list, com.list) {
4899                 spin_unlock_irq(mlx4_tlock(dev));
4900                 if (mtt->com.owner == slave) {
4901                         base = mtt->com.res_id;
4902                         state = mtt->com.from_state;
4903                         while (state != 0) {
4904                                 switch (state) {
4905                                 case RES_MTT_ALLOCATED:
4906                                         __mlx4_free_mtt_range(dev, base,
4907                                                               mtt->order);
4908                                         spin_lock_irq(mlx4_tlock(dev));
4909                                         rb_erase(&mtt->com.node,
4910                                                  &tracker->res_tree[RES_MTT]);
4911                                         list_del(&mtt->com.list);
4912                                         spin_unlock_irq(mlx4_tlock(dev));
4913                                         mlx4_release_resource(dev, slave, RES_MTT,
4914                                                               1 << mtt->order, 0);
4915                                         kfree(mtt);
4916                                         state = 0;
4917                                         break;
4918
4919                                 default:
4920                                         state = 0;
4921                                 }
4922                         }
4923                 }
4924                 spin_lock_irq(mlx4_tlock(dev));
4925         }
4926         spin_unlock_irq(mlx4_tlock(dev));
4927 }
4928
4929 static int mlx4_do_mirror_rule(struct mlx4_dev *dev, struct res_fs_rule *fs_rule)
4930 {
4931         struct mlx4_cmd_mailbox *mailbox;
4932         int err;
4933         struct res_fs_rule *mirr_rule;
4934         u64 reg_id;
4935
4936         mailbox = mlx4_alloc_cmd_mailbox(dev);
4937         if (IS_ERR(mailbox))
4938                 return PTR_ERR(mailbox);
4939
4940         if (!fs_rule->mirr_mbox) {
4941                 mlx4_err(dev, "rule mirroring mailbox is null\n");
4942                 return -EINVAL;
4943         }
4944         memcpy(mailbox->buf, fs_rule->mirr_mbox, fs_rule->mirr_mbox_size);
4945         err = mlx4_cmd_imm(dev, mailbox->dma, &reg_id, fs_rule->mirr_mbox_size >> 2, 0,
4946                            MLX4_QP_FLOW_STEERING_ATTACH, MLX4_CMD_TIME_CLASS_A,
4947                            MLX4_CMD_NATIVE);
4948         mlx4_free_cmd_mailbox(dev, mailbox);
4949
4950         if (err)
4951                 goto err;
4952
4953         err = add_res_range(dev, fs_rule->com.owner, reg_id, 1, RES_FS_RULE, fs_rule->qpn);
4954         if (err)
4955                 goto err_detach;
4956
4957         err = get_res(dev, fs_rule->com.owner, reg_id, RES_FS_RULE, &mirr_rule);
4958         if (err)
4959                 goto err_rem;
4960
4961         fs_rule->mirr_rule_id = reg_id;
4962         mirr_rule->mirr_rule_id = 0;
4963         mirr_rule->mirr_mbox_size = 0;
4964         mirr_rule->mirr_mbox = NULL;
4965         put_res(dev, fs_rule->com.owner, reg_id, RES_FS_RULE);
4966
4967         return 0;
4968 err_rem:
4969         rem_res_range(dev, fs_rule->com.owner, reg_id, 1, RES_FS_RULE, 0);
4970 err_detach:
4971         mlx4_cmd(dev, reg_id, 0, 0, MLX4_QP_FLOW_STEERING_DETACH,
4972                  MLX4_CMD_TIME_CLASS_A, MLX4_CMD_NATIVE);
4973 err:
4974         return err;
4975 }
4976
4977 static int mlx4_mirror_fs_rules(struct mlx4_dev *dev, bool bond)
4978 {
4979         struct mlx4_priv *priv = mlx4_priv(dev);
4980         struct mlx4_resource_tracker *tracker =
4981                 &priv->mfunc.master.res_tracker;
4982         struct rb_root *root = &tracker->res_tree[RES_FS_RULE];
4983         struct rb_node *p;
4984         struct res_fs_rule *fs_rule;
4985         int err = 0;
4986         LIST_HEAD(mirr_list);
4987
4988         for (p = rb_first(root); p; p = rb_next(p)) {
4989                 fs_rule = rb_entry(p, struct res_fs_rule, com.node);
4990                 if ((bond && fs_rule->mirr_mbox_size) ||
4991                     (!bond && !fs_rule->mirr_mbox_size))
4992                         list_add_tail(&fs_rule->mirr_list, &mirr_list);
4993         }
4994
4995         list_for_each_entry(fs_rule, &mirr_list, mirr_list) {
4996                 if (bond)
4997                         err += mlx4_do_mirror_rule(dev, fs_rule);
4998                 else
4999                         err += mlx4_undo_mirror_rule(dev, fs_rule);
5000         }
5001         return err;
5002 }
5003
5004 int mlx4_bond_fs_rules(struct mlx4_dev *dev)
5005 {
5006         return mlx4_mirror_fs_rules(dev, true);
5007 }
5008
5009 int mlx4_unbond_fs_rules(struct mlx4_dev *dev)
5010 {
5011         return mlx4_mirror_fs_rules(dev, false);
5012 }
5013
5014 static void rem_slave_fs_rule(struct mlx4_dev *dev, int slave)
5015 {
5016         struct mlx4_priv *priv = mlx4_priv(dev);
5017         struct mlx4_resource_tracker *tracker =
5018                 &priv->mfunc.master.res_tracker;
5019         struct list_head *fs_rule_list =
5020                 &tracker->slave_list[slave].res_list[RES_FS_RULE];
5021         struct res_fs_rule *fs_rule;
5022         struct res_fs_rule *tmp;
5023         int state;
5024         u64 base;
5025         int err;
5026
5027         err = move_all_busy(dev, slave, RES_FS_RULE);
5028         if (err)
5029                 mlx4_warn(dev, "rem_slave_fs_rule: Could not move all mtts to busy for slave %d\n",
5030                           slave);
5031
5032         spin_lock_irq(mlx4_tlock(dev));
5033         list_for_each_entry_safe(fs_rule, tmp, fs_rule_list, com.list) {
5034                 spin_unlock_irq(mlx4_tlock(dev));
5035                 if (fs_rule->com.owner == slave) {
5036                         base = fs_rule->com.res_id;
5037                         state = fs_rule->com.from_state;
5038                         while (state != 0) {
5039                                 switch (state) {
5040                                 case RES_FS_RULE_ALLOCATED:
5041                                         /* detach rule */
5042                                         err = mlx4_cmd(dev, base, 0, 0,
5043                                                        MLX4_QP_FLOW_STEERING_DETACH,
5044                                                        MLX4_CMD_TIME_CLASS_A,
5045                                                        MLX4_CMD_NATIVE);
5046
5047                                         spin_lock_irq(mlx4_tlock(dev));
5048                                         rb_erase(&fs_rule->com.node,
5049                                                  &tracker->res_tree[RES_FS_RULE]);
5050                                         list_del(&fs_rule->com.list);
5051                                         spin_unlock_irq(mlx4_tlock(dev));
5052                                         kfree(fs_rule);
5053                                         state = 0;
5054                                         break;
5055
5056                                 default:
5057                                         state = 0;
5058                                 }
5059                         }
5060                 }
5061                 spin_lock_irq(mlx4_tlock(dev));
5062         }
5063         spin_unlock_irq(mlx4_tlock(dev));
5064 }
5065
5066 static void rem_slave_eqs(struct mlx4_dev *dev, int slave)
5067 {
5068         struct mlx4_priv *priv = mlx4_priv(dev);
5069         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
5070         struct list_head *eq_list =
5071                 &tracker->slave_list[slave].res_list[RES_EQ];
5072         struct res_eq *eq;
5073         struct res_eq *tmp;
5074         int err;
5075         int state;
5076         LIST_HEAD(tlist);
5077         int eqn;
5078
5079         err = move_all_busy(dev, slave, RES_EQ);
5080         if (err)
5081                 mlx4_warn(dev, "rem_slave_eqs: Could not move all eqs - too busy for slave %d\n",
5082                           slave);
5083
5084         spin_lock_irq(mlx4_tlock(dev));
5085         list_for_each_entry_safe(eq, tmp, eq_list, com.list) {
5086                 spin_unlock_irq(mlx4_tlock(dev));
5087                 if (eq->com.owner == slave) {
5088                         eqn = eq->com.res_id;
5089                         state = eq->com.from_state;
5090                         while (state != 0) {
5091                                 switch (state) {
5092                                 case RES_EQ_RESERVED:
5093                                         spin_lock_irq(mlx4_tlock(dev));
5094                                         rb_erase(&eq->com.node,
5095                                                  &tracker->res_tree[RES_EQ]);
5096                                         list_del(&eq->com.list);
5097                                         spin_unlock_irq(mlx4_tlock(dev));
5098                                         kfree(eq);
5099                                         state = 0;
5100                                         break;
5101
5102                                 case RES_EQ_HW:
5103                                         err = mlx4_cmd(dev, slave, eqn & 0x3ff,
5104                                                        1, MLX4_CMD_HW2SW_EQ,
5105                                                        MLX4_CMD_TIME_CLASS_A,
5106                                                        MLX4_CMD_NATIVE);
5107                                         if (err)
5108                                                 mlx4_dbg(dev, "rem_slave_eqs: failed to move slave %d eqs %d to SW ownership\n",
5109                                                          slave, eqn & 0x3ff);
5110                                         atomic_dec(&eq->mtt->ref_count);
5111                                         state = RES_EQ_RESERVED;
5112                                         break;
5113
5114                                 default:
5115                                         state = 0;
5116                                 }
5117                         }
5118                 }
5119                 spin_lock_irq(mlx4_tlock(dev));
5120         }
5121         spin_unlock_irq(mlx4_tlock(dev));
5122 }
5123
5124 static void rem_slave_counters(struct mlx4_dev *dev, int slave)
5125 {
5126         struct mlx4_priv *priv = mlx4_priv(dev);
5127         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
5128         struct list_head *counter_list =
5129                 &tracker->slave_list[slave].res_list[RES_COUNTER];
5130         struct res_counter *counter;
5131         struct res_counter *tmp;
5132         int err;
5133         int *counters_arr = NULL;
5134         int i, j;
5135
5136         err = move_all_busy(dev, slave, RES_COUNTER);
5137         if (err)
5138                 mlx4_warn(dev, "rem_slave_counters: Could not move all counters - too busy for slave %d\n",
5139                           slave);
5140
5141         counters_arr = kmalloc_array(dev->caps.max_counters,
5142                                      sizeof(*counters_arr), GFP_KERNEL);
5143         if (!counters_arr)
5144                 return;
5145
5146         do {
5147                 i = 0;
5148                 j = 0;
5149                 spin_lock_irq(mlx4_tlock(dev));
5150                 list_for_each_entry_safe(counter, tmp, counter_list, com.list) {
5151                         if (counter->com.owner == slave) {
5152                                 counters_arr[i++] = counter->com.res_id;
5153                                 rb_erase(&counter->com.node,
5154                                          &tracker->res_tree[RES_COUNTER]);
5155                                 list_del(&counter->com.list);
5156                                 kfree(counter);
5157                         }
5158                 }
5159                 spin_unlock_irq(mlx4_tlock(dev));
5160
5161                 while (j < i) {
5162                         __mlx4_counter_free(dev, counters_arr[j++]);
5163                         mlx4_release_resource(dev, slave, RES_COUNTER, 1, 0);
5164                 }
5165         } while (i);
5166
5167         kfree(counters_arr);
5168 }
5169
5170 static void rem_slave_xrcdns(struct mlx4_dev *dev, int slave)
5171 {
5172         struct mlx4_priv *priv = mlx4_priv(dev);
5173         struct mlx4_resource_tracker *tracker = &priv->mfunc.master.res_tracker;
5174         struct list_head *xrcdn_list =
5175                 &tracker->slave_list[slave].res_list[RES_XRCD];
5176         struct res_xrcdn *xrcd;
5177         struct res_xrcdn *tmp;
5178         int err;
5179         int xrcdn;
5180
5181         err = move_all_busy(dev, slave, RES_XRCD);
5182         if (err)
5183                 mlx4_warn(dev, "rem_slave_xrcdns: Could not move all xrcdns - too busy for slave %d\n",
5184                           slave);
5185
5186         spin_lock_irq(mlx4_tlock(dev));
5187         list_for_each_entry_safe(xrcd, tmp, xrcdn_list, com.list) {
5188                 if (xrcd->com.owner == slave) {
5189                         xrcdn = xrcd->com.res_id;
5190                         rb_erase(&xrcd->com.node, &tracker->res_tree[RES_XRCD]);
5191                         list_del(&xrcd->com.list);
5192                         kfree(xrcd);
5193                         __mlx4_xrcd_free(dev, xrcdn);
5194                 }
5195         }
5196         spin_unlock_irq(mlx4_tlock(dev));
5197 }
5198
5199 void mlx4_delete_all_resources_for_slave(struct mlx4_dev *dev, int slave)
5200 {
5201         struct mlx4_priv *priv = mlx4_priv(dev);
5202         mlx4_reset_roce_gids(dev, slave);
5203         mutex_lock(&priv->mfunc.master.res_tracker.slave_list[slave].mutex);
5204         rem_slave_vlans(dev, slave);
5205         rem_slave_macs(dev, slave);
5206         rem_slave_fs_rule(dev, slave);
5207         rem_slave_qps(dev, slave);
5208         rem_slave_srqs(dev, slave);
5209         rem_slave_cqs(dev, slave);
5210         rem_slave_mrs(dev, slave);
5211         rem_slave_eqs(dev, slave);
5212         rem_slave_mtts(dev, slave);
5213         rem_slave_counters(dev, slave);
5214         rem_slave_xrcdns(dev, slave);
5215         mutex_unlock(&priv->mfunc.master.res_tracker.slave_list[slave].mutex);
5216 }
5217
5218 void mlx4_vf_immed_vlan_work_handler(struct work_struct *_work)
5219 {
5220         struct mlx4_vf_immed_vlan_work *work =
5221                 container_of(_work, struct mlx4_vf_immed_vlan_work, work);
5222         struct mlx4_cmd_mailbox *mailbox;
5223         struct mlx4_update_qp_context *upd_context;
5224         struct mlx4_dev *dev = &work->priv->dev;
5225         struct mlx4_resource_tracker *tracker =
5226                 &work->priv->mfunc.master.res_tracker;
5227         struct list_head *qp_list =
5228                 &tracker->slave_list[work->slave].res_list[RES_QP];
5229         struct res_qp *qp;
5230         struct res_qp *tmp;
5231         u64 qp_path_mask_vlan_ctrl =
5232                        ((1ULL << MLX4_UPD_QP_PATH_MASK_ETH_TX_BLOCK_UNTAGGED) |
5233                        (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_TX_BLOCK_1P) |
5234                        (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_TX_BLOCK_TAGGED) |
5235                        (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_RX_BLOCK_UNTAGGED) |
5236                        (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_RX_BLOCK_1P) |
5237                        (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_RX_BLOCK_TAGGED));
5238
5239         u64 qp_path_mask = ((1ULL << MLX4_UPD_QP_PATH_MASK_VLAN_INDEX) |
5240                        (1ULL << MLX4_UPD_QP_PATH_MASK_FVL) |
5241                        (1ULL << MLX4_UPD_QP_PATH_MASK_CV) |
5242                        (1ULL << MLX4_UPD_QP_PATH_MASK_ETH_HIDE_CQE_VLAN) |
5243                        (1ULL << MLX4_UPD_QP_PATH_MASK_FEUP) |
5244                        (1ULL << MLX4_UPD_QP_PATH_MASK_FVL_RX) |
5245                        (1ULL << MLX4_UPD_QP_PATH_MASK_SCHED_QUEUE));
5246
5247         int err;
5248         int port, errors = 0;
5249         u8 vlan_control;
5250
5251         if (mlx4_is_slave(dev)) {
5252                 mlx4_warn(dev, "Trying to update-qp in slave %d\n",
5253                           work->slave);
5254                 goto out;
5255         }
5256
5257         mailbox = mlx4_alloc_cmd_mailbox(dev);
5258         if (IS_ERR(mailbox))
5259                 goto out;
5260         if (work->flags & MLX4_VF_IMMED_VLAN_FLAG_LINK_DISABLE) /* block all */
5261                 vlan_control = MLX4_VLAN_CTRL_ETH_TX_BLOCK_TAGGED |
5262                         MLX4_VLAN_CTRL_ETH_TX_BLOCK_PRIO_TAGGED |
5263                         MLX4_VLAN_CTRL_ETH_TX_BLOCK_UNTAGGED |
5264                         MLX4_VLAN_CTRL_ETH_RX_BLOCK_PRIO_TAGGED |
5265                         MLX4_VLAN_CTRL_ETH_RX_BLOCK_UNTAGGED |
5266                         MLX4_VLAN_CTRL_ETH_RX_BLOCK_TAGGED;
5267         else if (!work->vlan_id)
5268                 vlan_control = MLX4_VLAN_CTRL_ETH_TX_BLOCK_TAGGED |
5269                         MLX4_VLAN_CTRL_ETH_RX_BLOCK_TAGGED;
5270         else
5271                 vlan_control = MLX4_VLAN_CTRL_ETH_TX_BLOCK_TAGGED |
5272                         MLX4_VLAN_CTRL_ETH_RX_BLOCK_PRIO_TAGGED |
5273                         MLX4_VLAN_CTRL_ETH_RX_BLOCK_UNTAGGED;
5274
5275         upd_context = mailbox->buf;
5276         upd_context->qp_mask = cpu_to_be64(1ULL << MLX4_UPD_QP_MASK_VSD);
5277
5278         spin_lock_irq(mlx4_tlock(dev));
5279         list_for_each_entry_safe(qp, tmp, qp_list, com.list) {
5280                 spin_unlock_irq(mlx4_tlock(dev));
5281                 if (qp->com.owner == work->slave) {
5282                         if (qp->com.from_state != RES_QP_HW ||
5283                             !qp->sched_queue ||  /* no INIT2RTR trans yet */
5284                             mlx4_is_qp_reserved(dev, qp->local_qpn) ||
5285                             qp->qpc_flags & (1 << MLX4_RSS_QPC_FLAG_OFFSET)) {
5286                                 spin_lock_irq(mlx4_tlock(dev));
5287                                 continue;
5288                         }
5289                         port = (qp->sched_queue >> 6 & 1) + 1;
5290                         if (port != work->port) {
5291                                 spin_lock_irq(mlx4_tlock(dev));
5292                                 continue;
5293                         }
5294                         if (MLX4_QP_ST_RC == ((qp->qpc_flags >> 16) & 0xff))
5295                                 upd_context->primary_addr_path_mask = cpu_to_be64(qp_path_mask);
5296                         else
5297                                 upd_context->primary_addr_path_mask =
5298                                         cpu_to_be64(qp_path_mask | qp_path_mask_vlan_ctrl);
5299                         if (work->vlan_id == MLX4_VGT) {
5300                                 upd_context->qp_context.param3 = qp->param3;
5301                                 upd_context->qp_context.pri_path.vlan_control = qp->vlan_control;
5302                                 upd_context->qp_context.pri_path.fvl_rx = qp->fvl_rx;
5303                                 upd_context->qp_context.pri_path.vlan_index = qp->vlan_index;
5304                                 upd_context->qp_context.pri_path.fl = qp->pri_path_fl;
5305                                 upd_context->qp_context.pri_path.feup = qp->feup;
5306                                 upd_context->qp_context.pri_path.sched_queue =
5307                                         qp->sched_queue;
5308                         } else {
5309                                 upd_context->qp_context.param3 = qp->param3 & ~cpu_to_be32(MLX4_STRIP_VLAN);
5310                                 upd_context->qp_context.pri_path.vlan_control = vlan_control;
5311                                 upd_context->qp_context.pri_path.vlan_index = work->vlan_ix;
5312                                 upd_context->qp_context.pri_path.fvl_rx =
5313                                         qp->fvl_rx | MLX4_FVL_RX_FORCE_ETH_VLAN;
5314                                 upd_context->qp_context.pri_path.fl =
5315                                         qp->pri_path_fl | MLX4_FL_CV | MLX4_FL_ETH_HIDE_CQE_VLAN;
5316                                 upd_context->qp_context.pri_path.feup =
5317                                         qp->feup | MLX4_FEUP_FORCE_ETH_UP | MLX4_FVL_FORCE_ETH_VLAN;
5318                                 upd_context->qp_context.pri_path.sched_queue =
5319                                         qp->sched_queue & 0xC7;
5320                                 upd_context->qp_context.pri_path.sched_queue |=
5321                                         ((work->qos & 0x7) << 3);
5322                                 upd_context->qp_mask |=
5323                                         cpu_to_be64(1ULL <<
5324                                                     MLX4_UPD_QP_MASK_QOS_VPP);
5325                                 upd_context->qp_context.qos_vport =
5326                                         work->qos_vport;
5327                         }
5328
5329                         err = mlx4_cmd(dev, mailbox->dma,
5330                                        qp->local_qpn & 0xffffff,
5331                                        0, MLX4_CMD_UPDATE_QP,
5332                                        MLX4_CMD_TIME_CLASS_C, MLX4_CMD_NATIVE);
5333                         if (err) {
5334                                 mlx4_info(dev, "UPDATE_QP failed for slave %d, port %d, qpn %d (%d)\n",
5335                                           work->slave, port, qp->local_qpn, err);
5336                                 errors++;
5337                         }
5338                 }
5339                 spin_lock_irq(mlx4_tlock(dev));
5340         }
5341         spin_unlock_irq(mlx4_tlock(dev));
5342         mlx4_free_cmd_mailbox(dev, mailbox);
5343
5344         if (errors)
5345                 mlx4_err(dev, "%d UPDATE_QP failures for slave %d, port %d\n",
5346                          errors, work->slave, work->port);
5347
5348         /* unregister previous vlan_id if needed and we had no errors
5349          * while updating the QPs
5350          */
5351         if (work->flags & MLX4_VF_IMMED_VLAN_FLAG_VLAN && !errors &&
5352             NO_INDX != work->orig_vlan_ix)
5353                 __mlx4_unregister_vlan(&work->priv->dev, work->port,
5354                                        work->orig_vlan_id);
5355 out:
5356         kfree(work);
5357         return;
5358 }