1 | /* |
2 | * Copyright (c) 2004, 2005 Topspin Communications. All rights reserved. |
3 | * Copyright (c) 2005 Mellanox Technologies. All rights reserved. |
4 | * |
5 | * This software is available to you under a choice of one of two |
6 | * licenses. You may choose to be licensed under the terms of the GNU |
7 | * General Public License (GPL) Version 2, available from the file |
8 | * COPYING in the main directory of this source tree, or the |
9 | * OpenIB.org BSD license below: |
10 | * |
11 | * Redistribution and use in source and binary forms, with or |
12 | * without modification, are permitted provided that the following |
13 | * conditions are met: |
14 | * |
15 | * - Redistributions of source code must retain the above |
16 | * copyright notice, this list of conditions and the following |
17 | * disclaimer. |
18 | * |
19 | * - Redistributions in binary form must reproduce the above |
20 | * copyright notice, this list of conditions and the following |
21 | * disclaimer in the documentation and/or other materials |
22 | * provided with the distribution. |
23 | * |
24 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, |
25 | * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
26 | * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND |
27 | * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS |
28 | * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN |
29 | * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
30 | * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
31 | * SOFTWARE. |
32 | */ |
33 | |
34 | #include <linux/slab.h> |
35 | |
36 | #include "ipoib.h" |
37 | |
38 | int ipoib_mcast_attach(struct net_device *dev, struct ib_device *hca, |
39 | union ib_gid *mgid, u16 mlid, int set_qkey, u32 qkey) |
40 | { |
41 | struct ipoib_dev_priv *priv = ipoib_priv(dev); |
42 | struct ib_qp_attr *qp_attr = NULL; |
43 | int ret; |
44 | u16 pkey_index; |
45 | |
46 | if (ib_find_pkey(device: priv->ca, port_num: priv->port, pkey: priv->pkey, index: &pkey_index)) { |
47 | clear_bit(nr: IPOIB_PKEY_ASSIGNED, addr: &priv->flags); |
48 | ret = -ENXIO; |
49 | goto out; |
50 | } |
51 | set_bit(nr: IPOIB_PKEY_ASSIGNED, addr: &priv->flags); |
52 | |
53 | if (set_qkey) { |
54 | ret = -ENOMEM; |
55 | qp_attr = kmalloc(size: sizeof(*qp_attr), GFP_KERNEL); |
56 | if (!qp_attr) |
57 | goto out; |
58 | |
59 | /* set correct QKey for QP */ |
60 | qp_attr->qkey = qkey; |
61 | ret = ib_modify_qp(qp: priv->qp, qp_attr, qp_attr_mask: IB_QP_QKEY); |
62 | if (ret) { |
63 | ipoib_warn(priv, "failed to modify QP, ret = %d\n" , ret); |
64 | goto out; |
65 | } |
66 | } |
67 | |
68 | /* attach QP to multicast group */ |
69 | ret = ib_attach_mcast(qp: priv->qp, gid: mgid, lid: mlid); |
70 | if (ret) |
71 | ipoib_warn(priv, "failed to attach to multicast group, ret = %d\n" , ret); |
72 | |
73 | out: |
74 | kfree(objp: qp_attr); |
75 | return ret; |
76 | } |
77 | |
78 | int ipoib_mcast_detach(struct net_device *dev, struct ib_device *hca, |
79 | union ib_gid *mgid, u16 mlid) |
80 | { |
81 | struct ipoib_dev_priv *priv = ipoib_priv(dev); |
82 | int ret; |
83 | |
84 | ret = ib_detach_mcast(qp: priv->qp, gid: mgid, lid: mlid); |
85 | |
86 | return ret; |
87 | } |
88 | |
89 | int ipoib_init_qp(struct net_device *dev) |
90 | { |
91 | struct ipoib_dev_priv *priv = ipoib_priv(dev); |
92 | int ret; |
93 | struct ib_qp_attr qp_attr; |
94 | int attr_mask; |
95 | |
96 | if (!test_bit(IPOIB_PKEY_ASSIGNED, &priv->flags)) |
97 | return -1; |
98 | |
99 | qp_attr.qp_state = IB_QPS_INIT; |
100 | qp_attr.qkey = 0; |
101 | qp_attr.port_num = priv->port; |
102 | qp_attr.pkey_index = priv->pkey_index; |
103 | attr_mask = |
104 | IB_QP_QKEY | |
105 | IB_QP_PORT | |
106 | IB_QP_PKEY_INDEX | |
107 | IB_QP_STATE; |
108 | ret = ib_modify_qp(qp: priv->qp, qp_attr: &qp_attr, qp_attr_mask: attr_mask); |
109 | if (ret) { |
110 | ipoib_warn(priv, "failed to modify QP to init, ret = %d\n" , ret); |
111 | goto out_fail; |
112 | } |
113 | |
114 | qp_attr.qp_state = IB_QPS_RTR; |
115 | /* Can't set this in a INIT->RTR transition */ |
116 | attr_mask &= ~IB_QP_PORT; |
117 | ret = ib_modify_qp(qp: priv->qp, qp_attr: &qp_attr, qp_attr_mask: attr_mask); |
118 | if (ret) { |
119 | ipoib_warn(priv, "failed to modify QP to RTR, ret = %d\n" , ret); |
120 | goto out_fail; |
121 | } |
122 | |
123 | qp_attr.qp_state = IB_QPS_RTS; |
124 | qp_attr.sq_psn = 0; |
125 | attr_mask |= IB_QP_SQ_PSN; |
126 | attr_mask &= ~IB_QP_PKEY_INDEX; |
127 | ret = ib_modify_qp(qp: priv->qp, qp_attr: &qp_attr, qp_attr_mask: attr_mask); |
128 | if (ret) { |
129 | ipoib_warn(priv, "failed to modify QP to RTS, ret = %d\n" , ret); |
130 | goto out_fail; |
131 | } |
132 | |
133 | return 0; |
134 | |
135 | out_fail: |
136 | qp_attr.qp_state = IB_QPS_RESET; |
137 | if (ib_modify_qp(qp: priv->qp, qp_attr: &qp_attr, qp_attr_mask: IB_QP_STATE)) |
138 | ipoib_warn(priv, "Failed to modify QP to RESET state\n" ); |
139 | |
140 | return ret; |
141 | } |
142 | |
143 | int ipoib_transport_dev_init(struct net_device *dev, struct ib_device *ca) |
144 | { |
145 | struct ipoib_dev_priv *priv = ipoib_priv(dev); |
146 | struct ib_qp_init_attr init_attr = { |
147 | .cap = { |
148 | .max_send_wr = ipoib_sendq_size, |
149 | .max_recv_wr = ipoib_recvq_size, |
150 | .max_send_sge = min_t(u32, priv->ca->attrs.max_send_sge, |
151 | MAX_SKB_FRAGS + 1), |
152 | .max_recv_sge = IPOIB_UD_RX_SG |
153 | }, |
154 | .sq_sig_type = IB_SIGNAL_ALL_WR, |
155 | .qp_type = IB_QPT_UD |
156 | }; |
157 | struct ib_cq_init_attr cq_attr = {}; |
158 | |
159 | int ret, size, req_vec; |
160 | int i; |
161 | static atomic_t counter; |
162 | |
163 | size = ipoib_recvq_size + 1; |
164 | ret = ipoib_cm_dev_init(dev); |
165 | if (!ret) { |
166 | size += ipoib_sendq_size; |
167 | if (ipoib_cm_has_srq(dev)) |
168 | size += ipoib_recvq_size + 1; /* 1 extra for rx_drain_qp */ |
169 | else |
170 | size += ipoib_recvq_size * ipoib_max_conn_qp; |
171 | } else |
172 | if (ret != -EOPNOTSUPP) |
173 | return ret; |
174 | |
175 | req_vec = atomic_inc_return(v: &counter) * 2; |
176 | cq_attr.cqe = size; |
177 | cq_attr.comp_vector = req_vec % priv->ca->num_comp_vectors; |
178 | priv->recv_cq = ib_create_cq(priv->ca, ipoib_ib_rx_completion, NULL, |
179 | priv, &cq_attr); |
180 | if (IS_ERR(ptr: priv->recv_cq)) { |
181 | pr_warn("%s: failed to create receive CQ\n" , ca->name); |
182 | goto out_cm_dev_cleanup; |
183 | } |
184 | |
185 | cq_attr.cqe = ipoib_sendq_size; |
186 | cq_attr.comp_vector = (req_vec + 1) % priv->ca->num_comp_vectors; |
187 | priv->send_cq = ib_create_cq(priv->ca, ipoib_ib_tx_completion, NULL, |
188 | priv, &cq_attr); |
189 | if (IS_ERR(ptr: priv->send_cq)) { |
190 | pr_warn("%s: failed to create send CQ\n" , ca->name); |
191 | goto out_free_recv_cq; |
192 | } |
193 | |
194 | if (ib_req_notify_cq(cq: priv->recv_cq, flags: IB_CQ_NEXT_COMP)) |
195 | goto out_free_send_cq; |
196 | |
197 | init_attr.send_cq = priv->send_cq; |
198 | init_attr.recv_cq = priv->recv_cq; |
199 | |
200 | if (priv->kernel_caps & IBK_UD_TSO) |
201 | init_attr.create_flags |= IB_QP_CREATE_IPOIB_UD_LSO; |
202 | |
203 | if (priv->kernel_caps & IBK_BLOCK_MULTICAST_LOOPBACK) |
204 | init_attr.create_flags |= IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK; |
205 | |
206 | if (priv->hca_caps & IB_DEVICE_MANAGED_FLOW_STEERING) |
207 | init_attr.create_flags |= IB_QP_CREATE_NETIF_QP; |
208 | |
209 | if (priv->kernel_caps & IBK_RDMA_NETDEV_OPA) |
210 | init_attr.create_flags |= IB_QP_CREATE_NETDEV_USE; |
211 | |
212 | priv->qp = ib_create_qp(pd: priv->pd, init_attr: &init_attr); |
213 | if (IS_ERR(ptr: priv->qp)) { |
214 | pr_warn("%s: failed to create QP\n" , ca->name); |
215 | goto out_free_send_cq; |
216 | } |
217 | |
218 | if (ib_req_notify_cq(cq: priv->send_cq, flags: IB_CQ_NEXT_COMP)) |
219 | goto out_free_send_cq; |
220 | |
221 | for (i = 0; i < MAX_SKB_FRAGS + 1; ++i) |
222 | priv->tx_sge[i].lkey = priv->pd->local_dma_lkey; |
223 | |
224 | priv->tx_wr.wr.opcode = IB_WR_SEND; |
225 | priv->tx_wr.wr.sg_list = priv->tx_sge; |
226 | priv->tx_wr.wr.send_flags = IB_SEND_SIGNALED; |
227 | |
228 | priv->rx_sge[0].lkey = priv->pd->local_dma_lkey; |
229 | |
230 | priv->rx_sge[0].length = IPOIB_UD_BUF_SIZE(priv->max_ib_mtu); |
231 | priv->rx_wr.num_sge = 1; |
232 | |
233 | priv->rx_wr.next = NULL; |
234 | priv->rx_wr.sg_list = priv->rx_sge; |
235 | |
236 | if (init_attr.cap.max_send_sge > 1) |
237 | dev->features |= NETIF_F_SG; |
238 | |
239 | priv->max_send_sge = init_attr.cap.max_send_sge; |
240 | |
241 | return 0; |
242 | |
243 | out_free_send_cq: |
244 | ib_destroy_cq(cq: priv->send_cq); |
245 | |
246 | out_free_recv_cq: |
247 | ib_destroy_cq(cq: priv->recv_cq); |
248 | |
249 | out_cm_dev_cleanup: |
250 | ipoib_cm_dev_cleanup(dev); |
251 | |
252 | return -ENODEV; |
253 | } |
254 | |
255 | void ipoib_transport_dev_cleanup(struct net_device *dev) |
256 | { |
257 | struct ipoib_dev_priv *priv = ipoib_priv(dev); |
258 | |
259 | if (priv->qp) { |
260 | if (ib_destroy_qp(qp: priv->qp)) |
261 | ipoib_warn(priv, "ib_qp_destroy failed\n" ); |
262 | |
263 | priv->qp = NULL; |
264 | } |
265 | |
266 | ib_destroy_cq(cq: priv->send_cq); |
267 | ib_destroy_cq(cq: priv->recv_cq); |
268 | } |
269 | |
270 | void ipoib_event(struct ib_event_handler *handler, |
271 | struct ib_event *record) |
272 | { |
273 | struct ipoib_dev_priv *priv = |
274 | container_of(handler, struct ipoib_dev_priv, event_handler); |
275 | |
276 | if (record->element.port_num != priv->port) |
277 | return; |
278 | |
279 | ipoib_dbg(priv, "Event %d on device %s port %d\n" , record->event, |
280 | dev_name(&record->device->dev), record->element.port_num); |
281 | |
282 | if (record->event == IB_EVENT_CLIENT_REREGISTER) { |
283 | queue_work(wq: ipoib_workqueue, work: &priv->flush_light); |
284 | } else if (record->event == IB_EVENT_PORT_ERR || |
285 | record->event == IB_EVENT_PORT_ACTIVE || |
286 | record->event == IB_EVENT_LID_CHANGE) { |
287 | queue_work(wq: ipoib_workqueue, work: &priv->flush_normal); |
288 | } else if (record->event == IB_EVENT_PKEY_CHANGE) { |
289 | queue_work(wq: ipoib_workqueue, work: &priv->flush_heavy); |
290 | } else if (record->event == IB_EVENT_GID_CHANGE && |
291 | !test_bit(IPOIB_FLAG_DEV_ADDR_SET, &priv->flags)) { |
292 | queue_work(wq: ipoib_workqueue, work: &priv->flush_light); |
293 | } |
294 | } |
295 | |