]>
Commit | Line | Data |
---|---|---|
fceaf24a | 1 | /* |
fceaf24a HJ |
2 | * Copyright (c) 2009, Microsoft Corporation. |
3 | * | |
4 | * This program is free software; you can redistribute it and/or modify it | |
5 | * under the terms and conditions of the GNU General Public License, | |
6 | * version 2, as published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope it will be useful, but WITHOUT | |
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | |
11 | * more details. | |
12 | * | |
13 | * You should have received a copy of the GNU General Public License along with | |
adf8d3ff | 14 | * this program; if not, see <http://www.gnu.org/licenses/>. |
fceaf24a HJ |
15 | * |
16 | * Authors: | |
d0e94d17 | 17 | * Haiyang Zhang <haiyangz@microsoft.com> |
fceaf24a | 18 | * Hank Janssen <hjanssen@microsoft.com> |
fceaf24a | 19 | */ |
eb335bc4 HJ |
20 | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt |
21 | ||
5654e932 | 22 | #include <linux/kernel.h> |
0c3b7b2f S |
23 | #include <linux/sched.h> |
24 | #include <linux/wait.h> | |
0ffa63b0 | 25 | #include <linux/mm.h> |
b4362c9c | 26 | #include <linux/delay.h> |
21a80820 | 27 | #include <linux/io.h> |
5a0e3ad6 | 28 | #include <linux/slab.h> |
d9871158 | 29 | #include <linux/netdevice.h> |
f157e78d | 30 | #include <linux/if_ether.h> |
d6472302 | 31 | #include <linux/vmalloc.h> |
9749fed5 | 32 | #include <linux/rtnetlink.h> |
43bf99ce | 33 | #include <linux/prefetch.h> |
9749fed5 | 34 | |
c25aaf81 | 35 | #include <asm/sync_bitops.h> |
3f335ea2 | 36 | |
5ca7252a | 37 | #include "hyperv_net.h" |
fceaf24a | 38 | |
84bf9cef KS |
39 | /* |
40 | * Switch the data path from the synthetic interface to the VF | |
41 | * interface. | |
42 | */ | |
0a1275ca | 43 | void netvsc_switch_datapath(struct net_device *ndev, bool vf) |
84bf9cef | 44 | { |
3d541ac5 VK |
45 | struct net_device_context *net_device_ctx = netdev_priv(ndev); |
46 | struct hv_device *dev = net_device_ctx->device_ctx; | |
79e8cbe7 | 47 | struct netvsc_device *nv_dev = rtnl_dereference(net_device_ctx->nvdev); |
0a1275ca | 48 | struct nvsp_message *init_pkt = &nv_dev->channel_init_pkt; |
84bf9cef KS |
49 | |
50 | memset(init_pkt, 0, sizeof(struct nvsp_message)); | |
51 | init_pkt->hdr.msg_type = NVSP_MSG4_TYPE_SWITCH_DATA_PATH; | |
52 | if (vf) | |
53 | init_pkt->msg.v4_msg.active_dp.active_datapath = | |
54 | NVSP_DATAPATH_VF; | |
55 | else | |
56 | init_pkt->msg.v4_msg.active_dp.active_datapath = | |
57 | NVSP_DATAPATH_SYNTHETIC; | |
58 | ||
59 | vmbus_sendpacket(dev->channel, init_pkt, | |
60 | sizeof(struct nvsp_message), | |
61 | (unsigned long)init_pkt, | |
62 | VM_PKT_DATA_INBAND, 0); | |
63 | } | |
64 | ||
88098834 | 65 | static struct netvsc_device *alloc_net_device(void) |
fceaf24a | 66 | { |
85799a37 | 67 | struct netvsc_device *net_device; |
fceaf24a | 68 | |
85799a37 HZ |
69 | net_device = kzalloc(sizeof(struct netvsc_device), GFP_KERNEL); |
70 | if (!net_device) | |
fceaf24a HJ |
71 | return NULL; |
72 | ||
dc5cd894 | 73 | init_waitqueue_head(&net_device->wait_drain); |
c38b9c71 | 74 | net_device->destroy = false; |
84bf9cef | 75 | atomic_set(&net_device->open_cnt, 0); |
7c3877f2 HZ |
76 | net_device->max_pkt = RNDIS_MAX_PKT_DEFAULT; |
77 | net_device->pkt_align = RNDIS_PKT_ALIGN_DEFAULT; | |
8b532797 | 78 | |
fd612602 | 79 | init_completion(&net_device->channel_init_wait); |
732e4985 | 80 | init_waitqueue_head(&net_device->subchan_open); |
8195b139 | 81 | INIT_WORK(&net_device->subchan_work, rndis_set_subchannel); |
7c3877f2 | 82 | |
85799a37 | 83 | return net_device; |
fceaf24a HJ |
84 | } |
85 | ||
545a8e79 | 86 | static void free_netvsc_device(struct rcu_head *head) |
f90251c8 | 87 | { |
545a8e79 | 88 | struct netvsc_device *nvdev |
89 | = container_of(head, struct netvsc_device, rcu); | |
c0b558e5 HZ |
90 | int i; |
91 | ||
92 | for (i = 0; i < VRSS_CHANNEL_MAX; i++) | |
7426b1a5 | 93 | vfree(nvdev->chan_table[i].mrc.slots); |
c0b558e5 | 94 | |
f90251c8 HZ |
95 | kfree(nvdev); |
96 | } | |
97 | ||
545a8e79 | 98 | static void free_netvsc_device_rcu(struct netvsc_device *nvdev) |
99 | { | |
100 | call_rcu(&nvdev->rcu, free_netvsc_device); | |
101 | } | |
fceaf24a | 102 | |
7a2a0a84 | 103 | static void netvsc_destroy_buf(struct hv_device *device) |
ec91cd09 HZ |
104 | { |
105 | struct nvsp_message *revoke_packet; | |
3d541ac5 | 106 | struct net_device *ndev = hv_get_drvdata(device); |
3962981f | 107 | struct net_device_context *ndc = netdev_priv(ndev); |
108 | struct netvsc_device *net_device = rtnl_dereference(ndc->nvdev); | |
7a2a0a84 | 109 | int ret; |
ec91cd09 HZ |
110 | |
111 | /* | |
112 | * If we got a section count, it means we received a | |
113 | * SendReceiveBufferComplete msg (ie sent | |
114 | * NvspMessage1TypeSendReceiveBuffer msg) therefore, we need | |
115 | * to send a revoke msg here | |
116 | */ | |
117 | if (net_device->recv_section_cnt) { | |
118 | /* Send the revoke receive buffer */ | |
119 | revoke_packet = &net_device->revoke_packet; | |
120 | memset(revoke_packet, 0, sizeof(struct nvsp_message)); | |
121 | ||
122 | revoke_packet->hdr.msg_type = | |
123 | NVSP_MSG1_TYPE_REVOKE_RECV_BUF; | |
124 | revoke_packet->msg.v1_msg. | |
125 | revoke_recv_buf.id = NETVSC_RECEIVE_BUFFER_ID; | |
126 | ||
3d541ac5 | 127 | ret = vmbus_sendpacket(device->channel, |
ec91cd09 HZ |
128 | revoke_packet, |
129 | sizeof(struct nvsp_message), | |
130 | (unsigned long)revoke_packet, | |
131 | VM_PKT_DATA_INBAND, 0); | |
73e64fa4 S |
132 | /* If the failure is because the channel is rescinded; |
133 | * ignore the failure since we cannot send on a rescinded | |
134 | * channel. This would allow us to properly cleanup | |
135 | * even when the channel is rescinded. | |
136 | */ | |
137 | if (device->channel->rescind) | |
138 | ret = 0; | |
ec91cd09 HZ |
139 | /* |
140 | * If we failed here, we might as well return and | |
141 | * have a leak rather than continue and a bugchk | |
142 | */ | |
143 | if (ret != 0) { | |
d9871158 | 144 | netdev_err(ndev, "unable to send " |
c909ebbd | 145 | "revoke receive buffer to netvsp\n"); |
7a2a0a84 | 146 | return; |
ec91cd09 | 147 | } |
8b532797 | 148 | net_device->recv_section_cnt = 0; |
ec91cd09 HZ |
149 | } |
150 | ||
151 | /* Teardown the gpadl on the vsp end */ | |
152 | if (net_device->recv_buf_gpadl_handle) { | |
3d541ac5 VK |
153 | ret = vmbus_teardown_gpadl(device->channel, |
154 | net_device->recv_buf_gpadl_handle); | |
ec91cd09 HZ |
155 | |
156 | /* If we failed here, we might as well return and have a leak | |
157 | * rather than continue and a bugchk | |
158 | */ | |
159 | if (ret != 0) { | |
d9871158 | 160 | netdev_err(ndev, |
c909ebbd | 161 | "unable to teardown receive buffer's gpadl\n"); |
7a2a0a84 | 162 | return; |
ec91cd09 HZ |
163 | } |
164 | net_device->recv_buf_gpadl_handle = 0; | |
165 | } | |
166 | ||
167 | if (net_device->recv_buf) { | |
168 | /* Free up the receive buffer */ | |
b679ef73 | 169 | vfree(net_device->recv_buf); |
ec91cd09 HZ |
170 | net_device->recv_buf = NULL; |
171 | } | |
172 | ||
c25aaf81 KS |
173 | /* Deal with the send buffer we may have setup. |
174 | * If we got a send section size, it means we received a | |
c51ed182 HZ |
175 | * NVSP_MSG1_TYPE_SEND_SEND_BUF_COMPLETE msg (ie sent |
176 | * NVSP_MSG1_TYPE_SEND_SEND_BUF msg) therefore, we need | |
c25aaf81 KS |
177 | * to send a revoke msg here |
178 | */ | |
8b532797 | 179 | if (net_device->send_section_cnt) { |
c25aaf81 KS |
180 | /* Send the revoke receive buffer */ |
181 | revoke_packet = &net_device->revoke_packet; | |
182 | memset(revoke_packet, 0, sizeof(struct nvsp_message)); | |
183 | ||
184 | revoke_packet->hdr.msg_type = | |
185 | NVSP_MSG1_TYPE_REVOKE_SEND_BUF; | |
c51ed182 HZ |
186 | revoke_packet->msg.v1_msg.revoke_send_buf.id = |
187 | NETVSC_SEND_BUFFER_ID; | |
c25aaf81 | 188 | |
3d541ac5 | 189 | ret = vmbus_sendpacket(device->channel, |
c25aaf81 KS |
190 | revoke_packet, |
191 | sizeof(struct nvsp_message), | |
192 | (unsigned long)revoke_packet, | |
193 | VM_PKT_DATA_INBAND, 0); | |
73e64fa4 S |
194 | |
195 | /* If the failure is because the channel is rescinded; | |
196 | * ignore the failure since we cannot send on a rescinded | |
197 | * channel. This would allow us to properly cleanup | |
198 | * even when the channel is rescinded. | |
199 | */ | |
200 | if (device->channel->rescind) | |
201 | ret = 0; | |
202 | ||
c25aaf81 KS |
203 | /* If we failed here, we might as well return and |
204 | * have a leak rather than continue and a bugchk | |
205 | */ | |
206 | if (ret != 0) { | |
207 | netdev_err(ndev, "unable to send " | |
208 | "revoke send buffer to netvsp\n"); | |
7a2a0a84 | 209 | return; |
c25aaf81 | 210 | } |
8b532797 | 211 | net_device->send_section_cnt = 0; |
c25aaf81 KS |
212 | } |
213 | /* Teardown the gpadl on the vsp end */ | |
214 | if (net_device->send_buf_gpadl_handle) { | |
3d541ac5 | 215 | ret = vmbus_teardown_gpadl(device->channel, |
c25aaf81 KS |
216 | net_device->send_buf_gpadl_handle); |
217 | ||
218 | /* If we failed here, we might as well return and have a leak | |
219 | * rather than continue and a bugchk | |
220 | */ | |
221 | if (ret != 0) { | |
222 | netdev_err(ndev, | |
223 | "unable to teardown send buffer's gpadl\n"); | |
7a2a0a84 | 224 | return; |
c25aaf81 | 225 | } |
2f18423d | 226 | net_device->send_buf_gpadl_handle = 0; |
c25aaf81 KS |
227 | } |
228 | if (net_device->send_buf) { | |
c51ed182 | 229 | /* Free up the send buffer */ |
06b47aac | 230 | vfree(net_device->send_buf); |
c25aaf81 KS |
231 | net_device->send_buf = NULL; |
232 | } | |
233 | kfree(net_device->send_section_map); | |
ec91cd09 HZ |
234 | } |
235 | ||
7426b1a5 | 236 | int netvsc_alloc_recv_comp_ring(struct netvsc_device *net_device, u32 q_idx) |
237 | { | |
238 | struct netvsc_channel *nvchan = &net_device->chan_table[q_idx]; | |
239 | int node = cpu_to_node(nvchan->channel->target_cpu); | |
240 | size_t size; | |
241 | ||
242 | size = net_device->recv_completion_cnt * sizeof(struct recv_comp_data); | |
243 | nvchan->mrc.slots = vzalloc_node(size, node); | |
244 | if (!nvchan->mrc.slots) | |
245 | nvchan->mrc.slots = vzalloc(size); | |
246 | ||
247 | return nvchan->mrc.slots ? 0 : -ENOMEM; | |
248 | } | |
249 | ||
95790837 | 250 | static int netvsc_init_buf(struct hv_device *device, |
8b532797 | 251 | struct netvsc_device *net_device, |
252 | const struct netvsc_device_info *device_info) | |
fceaf24a | 253 | { |
7426b1a5 | 254 | struct nvsp_1_message_send_receive_buffer_complete *resp; |
95833370 | 255 | struct net_device *ndev = hv_get_drvdata(device); |
256 | struct nvsp_message *init_packet; | |
8b532797 | 257 | unsigned int buf_size; |
fdfb70d2 | 258 | size_t map_words; |
95833370 | 259 | int ret = 0; |
0a726c2b | 260 | |
8b532797 | 261 | /* Get receive buffer area. */ |
0ab09bef | 262 | buf_size = device_info->recv_sections * device_info->recv_section_size; |
8b532797 | 263 | buf_size = roundup(buf_size, PAGE_SIZE); |
264 | ||
265 | net_device->recv_buf = vzalloc(buf_size); | |
53d21fdb | 266 | if (!net_device->recv_buf) { |
8b532797 | 267 | netdev_err(ndev, |
268 | "unable to allocate receive buffer of size %u\n", | |
269 | buf_size); | |
927bc33c | 270 | ret = -ENOMEM; |
0c3b7b2f | 271 | goto cleanup; |
fceaf24a | 272 | } |
fceaf24a | 273 | |
454f18a9 BP |
274 | /* |
275 | * Establish the gpadl handle for this buffer on this | |
276 | * channel. Note: This call uses the vmbus connection rather | |
277 | * than the channel to establish the gpadl handle. | |
278 | */ | |
53d21fdb | 279 | ret = vmbus_establish_gpadl(device->channel, net_device->recv_buf, |
8b532797 | 280 | buf_size, |
53d21fdb | 281 | &net_device->recv_buf_gpadl_handle); |
21a80820 | 282 | if (ret != 0) { |
d9871158 | 283 | netdev_err(ndev, |
c909ebbd | 284 | "unable to establish receive buffer's gpadl\n"); |
0c3b7b2f | 285 | goto cleanup; |
fceaf24a HJ |
286 | } |
287 | ||
454f18a9 | 288 | /* Notify the NetVsp of the gpadl handle */ |
53d21fdb | 289 | init_packet = &net_device->channel_init_pkt; |
85799a37 | 290 | memset(init_packet, 0, sizeof(struct nvsp_message)); |
53d21fdb HZ |
291 | init_packet->hdr.msg_type = NVSP_MSG1_TYPE_SEND_RECV_BUF; |
292 | init_packet->msg.v1_msg.send_recv_buf. | |
293 | gpadl_handle = net_device->recv_buf_gpadl_handle; | |
294 | init_packet->msg.v1_msg. | |
295 | send_recv_buf.id = NETVSC_RECEIVE_BUFFER_ID; | |
fceaf24a | 296 | |
454f18a9 | 297 | /* Send the gpadl notification request */ |
85799a37 | 298 | ret = vmbus_sendpacket(device->channel, init_packet, |
5a4df290 | 299 | sizeof(struct nvsp_message), |
85799a37 | 300 | (unsigned long)init_packet, |
415f2287 | 301 | VM_PKT_DATA_INBAND, |
5a4df290 | 302 | VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED); |
21a80820 | 303 | if (ret != 0) { |
d9871158 | 304 | netdev_err(ndev, |
c909ebbd | 305 | "unable to send receive buffer's gpadl to netvsp\n"); |
0c3b7b2f | 306 | goto cleanup; |
fceaf24a HJ |
307 | } |
308 | ||
5362855a | 309 | wait_for_completion(&net_device->channel_init_wait); |
fceaf24a | 310 | |
454f18a9 | 311 | /* Check the response */ |
7426b1a5 | 312 | resp = &init_packet->msg.v1_msg.send_recv_buf_complete; |
313 | if (resp->status != NVSP_STAT_SUCCESS) { | |
314 | netdev_err(ndev, | |
315 | "Unable to complete receive buffer initialization with NetVsp - status %d\n", | |
316 | resp->status); | |
927bc33c | 317 | ret = -EINVAL; |
0c3b7b2f | 318 | goto cleanup; |
fceaf24a HJ |
319 | } |
320 | ||
454f18a9 | 321 | /* Parse the response */ |
7426b1a5 | 322 | netdev_dbg(ndev, "Receive sections: %u sub_allocs: size %u count: %u\n", |
323 | resp->num_sections, resp->sections[0].sub_alloc_size, | |
324 | resp->sections[0].num_sub_allocs); | |
fceaf24a | 325 | |
8b532797 | 326 | /* There should only be one section for the entire receive buffer */ |
327 | if (resp->num_sections != 1 || resp->sections[0].offset != 0) { | |
927bc33c | 328 | ret = -EINVAL; |
0c3b7b2f | 329 | goto cleanup; |
fceaf24a HJ |
330 | } |
331 | ||
8b532797 | 332 | net_device->recv_section_size = resp->sections[0].sub_alloc_size; |
333 | net_device->recv_section_cnt = resp->sections[0].num_sub_allocs; | |
334 | ||
7426b1a5 | 335 | /* Setup receive completion ring */ |
336 | net_device->recv_completion_cnt | |
8b532797 | 337 | = round_up(net_device->recv_section_cnt + 1, |
7426b1a5 | 338 | PAGE_SIZE / sizeof(u64)); |
339 | ret = netvsc_alloc_recv_comp_ring(net_device, 0); | |
340 | if (ret) | |
341 | goto cleanup; | |
342 | ||
343 | /* Now setup the send buffer. */ | |
0ab09bef | 344 | buf_size = device_info->send_sections * device_info->send_section_size; |
8b532797 | 345 | buf_size = round_up(buf_size, PAGE_SIZE); |
346 | ||
347 | net_device->send_buf = vzalloc(buf_size); | |
c25aaf81 | 348 | if (!net_device->send_buf) { |
8b532797 | 349 | netdev_err(ndev, "unable to allocate send buffer of size %u\n", |
350 | buf_size); | |
c25aaf81 KS |
351 | ret = -ENOMEM; |
352 | goto cleanup; | |
353 | } | |
354 | ||
355 | /* Establish the gpadl handle for this buffer on this | |
356 | * channel. Note: This call uses the vmbus connection rather | |
357 | * than the channel to establish the gpadl handle. | |
358 | */ | |
359 | ret = vmbus_establish_gpadl(device->channel, net_device->send_buf, | |
8b532797 | 360 | buf_size, |
c25aaf81 KS |
361 | &net_device->send_buf_gpadl_handle); |
362 | if (ret != 0) { | |
363 | netdev_err(ndev, | |
364 | "unable to establish send buffer's gpadl\n"); | |
365 | goto cleanup; | |
366 | } | |
367 | ||
368 | /* Notify the NetVsp of the gpadl handle */ | |
369 | init_packet = &net_device->channel_init_pkt; | |
370 | memset(init_packet, 0, sizeof(struct nvsp_message)); | |
371 | init_packet->hdr.msg_type = NVSP_MSG1_TYPE_SEND_SEND_BUF; | |
c51ed182 | 372 | init_packet->msg.v1_msg.send_send_buf.gpadl_handle = |
c25aaf81 | 373 | net_device->send_buf_gpadl_handle; |
c51ed182 | 374 | init_packet->msg.v1_msg.send_send_buf.id = NETVSC_SEND_BUFFER_ID; |
c25aaf81 KS |
375 | |
376 | /* Send the gpadl notification request */ | |
377 | ret = vmbus_sendpacket(device->channel, init_packet, | |
378 | sizeof(struct nvsp_message), | |
379 | (unsigned long)init_packet, | |
380 | VM_PKT_DATA_INBAND, | |
381 | VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED); | |
382 | if (ret != 0) { | |
383 | netdev_err(ndev, | |
384 | "unable to send send buffer's gpadl to netvsp\n"); | |
385 | goto cleanup; | |
386 | } | |
387 | ||
5362855a | 388 | wait_for_completion(&net_device->channel_init_wait); |
c25aaf81 KS |
389 | |
390 | /* Check the response */ | |
391 | if (init_packet->msg.v1_msg. | |
392 | send_send_buf_complete.status != NVSP_STAT_SUCCESS) { | |
393 | netdev_err(ndev, "Unable to complete send buffer " | |
394 | "initialization with NetVsp - status %d\n", | |
395 | init_packet->msg.v1_msg. | |
c51ed182 | 396 | send_send_buf_complete.status); |
c25aaf81 KS |
397 | ret = -EINVAL; |
398 | goto cleanup; | |
399 | } | |
400 | ||
401 | /* Parse the response */ | |
402 | net_device->send_section_size = init_packet->msg. | |
403 | v1_msg.send_send_buf_complete.section_size; | |
404 | ||
8b532797 | 405 | /* Section count is simply the size divided by the section size. */ |
406 | net_device->send_section_cnt = buf_size / net_device->send_section_size; | |
c25aaf81 | 407 | |
93ba2222 VK |
408 | netdev_dbg(ndev, "Send section size: %d, Section count:%d\n", |
409 | net_device->send_section_size, net_device->send_section_cnt); | |
c25aaf81 KS |
410 | |
411 | /* Setup state for managing the send buffer. */ | |
fdfb70d2 | 412 | map_words = DIV_ROUND_UP(net_device->send_section_cnt, BITS_PER_LONG); |
c25aaf81 | 413 | |
fdfb70d2 | 414 | net_device->send_section_map = kcalloc(map_words, sizeof(ulong), GFP_KERNEL); |
dd1d3f8f WY |
415 | if (net_device->send_section_map == NULL) { |
416 | ret = -ENOMEM; | |
c25aaf81 | 417 | goto cleanup; |
dd1d3f8f | 418 | } |
c25aaf81 | 419 | |
0c3b7b2f | 420 | goto exit; |
fceaf24a | 421 | |
0c3b7b2f | 422 | cleanup: |
3d541ac5 | 423 | netvsc_destroy_buf(device); |
fceaf24a | 424 | |
0c3b7b2f | 425 | exit: |
fceaf24a HJ |
426 | return ret; |
427 | } | |
428 | ||
f157e78d HZ |
429 | /* Negotiate NVSP protocol version */ |
430 | static int negotiate_nvsp_ver(struct hv_device *device, | |
431 | struct netvsc_device *net_device, | |
432 | struct nvsp_message *init_packet, | |
433 | u32 nvsp_ver) | |
fceaf24a | 434 | { |
0a1275ca | 435 | struct net_device *ndev = hv_get_drvdata(device); |
7390fe9c | 436 | int ret; |
fceaf24a | 437 | |
85799a37 | 438 | memset(init_packet, 0, sizeof(struct nvsp_message)); |
53d21fdb | 439 | init_packet->hdr.msg_type = NVSP_MSG_TYPE_INIT; |
f157e78d HZ |
440 | init_packet->msg.init_msg.init.min_protocol_ver = nvsp_ver; |
441 | init_packet->msg.init_msg.init.max_protocol_ver = nvsp_ver; | |
fceaf24a | 442 | |
454f18a9 | 443 | /* Send the init request */ |
85799a37 | 444 | ret = vmbus_sendpacket(device->channel, init_packet, |
5a4df290 | 445 | sizeof(struct nvsp_message), |
85799a37 | 446 | (unsigned long)init_packet, |
415f2287 | 447 | VM_PKT_DATA_INBAND, |
5a4df290 | 448 | VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED); |
21a80820 | 449 | |
b8a3d52b | 450 | if (ret != 0) |
f157e78d | 451 | return ret; |
fceaf24a | 452 | |
5362855a | 453 | wait_for_completion(&net_device->channel_init_wait); |
fceaf24a | 454 | |
53d21fdb | 455 | if (init_packet->msg.init_msg.init_complete.status != |
f157e78d HZ |
456 | NVSP_STAT_SUCCESS) |
457 | return -EINVAL; | |
fceaf24a | 458 | |
a1eabb01 | 459 | if (nvsp_ver == NVSP_PROTOCOL_VERSION_1) |
f157e78d HZ |
460 | return 0; |
461 | ||
71790a27 | 462 | /* NVSPv2 or later: Send NDIS config */ |
f157e78d HZ |
463 | memset(init_packet, 0, sizeof(struct nvsp_message)); |
464 | init_packet->hdr.msg_type = NVSP_MSG2_TYPE_SEND_NDIS_CONFIG; | |
0a1275ca | 465 | init_packet->msg.v2_msg.send_ndis_config.mtu = ndev->mtu + ETH_HLEN; |
1f5f3a75 | 466 | init_packet->msg.v2_msg.send_ndis_config.capability.ieee8021q = 1; |
f157e78d | 467 | |
7f5d5af0 | 468 | if (nvsp_ver >= NVSP_PROTOCOL_VERSION_5) { |
71790a27 HZ |
469 | init_packet->msg.v2_msg.send_ndis_config.capability.sriov = 1; |
470 | ||
7f5d5af0 HZ |
471 | /* Teaming bit is needed to receive link speed updates */ |
472 | init_packet->msg.v2_msg.send_ndis_config.capability.teaming = 1; | |
473 | } | |
474 | ||
f157e78d HZ |
475 | ret = vmbus_sendpacket(device->channel, init_packet, |
476 | sizeof(struct nvsp_message), | |
477 | (unsigned long)init_packet, | |
478 | VM_PKT_DATA_INBAND, 0); | |
479 | ||
480 | return ret; | |
481 | } | |
482 | ||
95790837 | 483 | static int netvsc_connect_vsp(struct hv_device *device, |
8b532797 | 484 | struct netvsc_device *net_device, |
485 | const struct netvsc_device_info *device_info) | |
f157e78d | 486 | { |
e5a78fad SH |
487 | const u32 ver_list[] = { |
488 | NVSP_PROTOCOL_VERSION_1, NVSP_PROTOCOL_VERSION_2, | |
95790837 | 489 | NVSP_PROTOCOL_VERSION_4, NVSP_PROTOCOL_VERSION_5 |
490 | }; | |
491 | struct nvsp_message *init_packet; | |
492 | int ndis_version, i, ret; | |
f157e78d HZ |
493 | |
494 | init_packet = &net_device->channel_init_pkt; | |
495 | ||
496 | /* Negotiate the latest NVSP protocol supported */ | |
e5a78fad | 497 | for (i = ARRAY_SIZE(ver_list) - 1; i >= 0; i--) |
a1eabb01 HZ |
498 | if (negotiate_nvsp_ver(device, net_device, init_packet, |
499 | ver_list[i]) == 0) { | |
500 | net_device->nvsp_version = ver_list[i]; | |
501 | break; | |
502 | } | |
503 | ||
504 | if (i < 0) { | |
0f48c72c | 505 | ret = -EPROTO; |
0c3b7b2f | 506 | goto cleanup; |
fceaf24a | 507 | } |
f157e78d HZ |
508 | |
509 | pr_debug("Negotiated NVSP version:%x\n", net_device->nvsp_version); | |
510 | ||
454f18a9 | 511 | /* Send the ndis version */ |
85799a37 | 512 | memset(init_packet, 0, sizeof(struct nvsp_message)); |
fceaf24a | 513 | |
a1eabb01 | 514 | if (net_device->nvsp_version <= NVSP_PROTOCOL_VERSION_4) |
1f73db49 | 515 | ndis_version = 0x00060001; |
a1eabb01 HZ |
516 | else |
517 | ndis_version = 0x0006001e; | |
fceaf24a | 518 | |
53d21fdb HZ |
519 | init_packet->hdr.msg_type = NVSP_MSG1_TYPE_SEND_NDIS_VER; |
520 | init_packet->msg.v1_msg. | |
521 | send_ndis_ver.ndis_major_ver = | |
85799a37 | 522 | (ndis_version & 0xFFFF0000) >> 16; |
53d21fdb HZ |
523 | init_packet->msg.v1_msg. |
524 | send_ndis_ver.ndis_minor_ver = | |
85799a37 | 525 | ndis_version & 0xFFFF; |
fceaf24a | 526 | |
454f18a9 | 527 | /* Send the init request */ |
85799a37 | 528 | ret = vmbus_sendpacket(device->channel, init_packet, |
0c3b7b2f S |
529 | sizeof(struct nvsp_message), |
530 | (unsigned long)init_packet, | |
531 | VM_PKT_DATA_INBAND, 0); | |
0f48c72c | 532 | if (ret != 0) |
0c3b7b2f | 533 | goto cleanup; |
454f18a9 | 534 | |
99d3016d | 535 | |
8b532797 | 536 | ret = netvsc_init_buf(device, net_device, device_info); |
fceaf24a | 537 | |
0c3b7b2f | 538 | cleanup: |
fceaf24a HJ |
539 | return ret; |
540 | } | |
541 | ||
/*
 * Undo netvsc_connect_vsp(): the only state to release is the shared
 * receive/send buffers, which netvsc_destroy_buf() handles.
 */
static void netvsc_disconnect_vsp(struct hv_device *device)
{
	netvsc_destroy_buf(device);
}
546 | ||
3e189519 | 547 | /* |
5a71ae30 | 548 | * netvsc_device_remove - Callback when the root bus device is removed |
21a80820 | 549 | */ |
e08f3ea5 | 550 | void netvsc_device_remove(struct hv_device *device) |
fceaf24a | 551 | { |
3d541ac5 VK |
552 | struct net_device *ndev = hv_get_drvdata(device); |
553 | struct net_device_context *net_device_ctx = netdev_priv(ndev); | |
79e8cbe7 | 554 | struct netvsc_device *net_device |
555 | = rtnl_dereference(net_device_ctx->nvdev); | |
15a863bf | 556 | int i; |
fceaf24a | 557 | |
8195b139 SH |
558 | cancel_work_sync(&net_device->subchan_work); |
559 | ||
3d541ac5 | 560 | netvsc_disconnect_vsp(device); |
9d88f33a | 561 | |
545a8e79 | 562 | RCU_INIT_POINTER(net_device_ctx->nvdev, NULL); |
3852409b | 563 | |
86c921af S |
564 | /* |
565 | * At this point, no one should be accessing net_device | |
566 | * except in here | |
567 | */ | |
93ba2222 | 568 | netdev_dbg(ndev, "net device safe to remove\n"); |
fceaf24a | 569 | |
454f18a9 | 570 | /* Now, we can close the channel safely */ |
85799a37 | 571 | vmbus_close(device->channel); |
fceaf24a | 572 | |
76bb5db5 | 573 | /* And dissassociate NAPI context from device */ |
79cd874c | 574 | for (i = 0; i < net_device->num_chn; i++) |
76bb5db5 | 575 | netif_napi_del(&net_device->chan_table[i].napi); |
15a863bf | 576 | |
454f18a9 | 577 | /* Release all resources */ |
545a8e79 | 578 | free_netvsc_device_rcu(net_device); |
fceaf24a HJ |
579 | } |
580 | ||
33be96e4 HZ |
581 | #define RING_AVAIL_PERCENT_HIWATER 20 |
582 | #define RING_AVAIL_PERCENT_LOWATER 10 | |
583 | ||
584 | /* | |
585 | * Get the percentage of available bytes to write in the ring. | |
586 | * The return value is in range from 0 to 100. | |
587 | */ | |
588 | static inline u32 hv_ringbuf_avail_percent( | |
589 | struct hv_ring_buffer_info *ring_info) | |
590 | { | |
591 | u32 avail_read, avail_write; | |
592 | ||
593 | hv_get_ringbuffer_availbytes(ring_info, &avail_read, &avail_write); | |
594 | ||
595 | return avail_write * 100 / ring_info->ring_datasize; | |
596 | } | |
597 | ||
c25aaf81 KS |
598 | static inline void netvsc_free_send_slot(struct netvsc_device *net_device, |
599 | u32 index) | |
600 | { | |
601 | sync_change_bit(index, net_device->send_section_map); | |
602 | } | |
603 | ||
bc304dd3 SH |
604 | static void netvsc_send_tx_complete(struct netvsc_device *net_device, |
605 | struct vmbus_channel *incoming_channel, | |
606 | struct hv_device *device, | |
f9645430 | 607 | const struct vmpacket_descriptor *desc, |
608 | int budget) | |
bc304dd3 | 609 | { |
50698d80 | 610 | struct sk_buff *skb = (struct sk_buff *)(unsigned long)desc->trans_id; |
bc304dd3 | 611 | struct net_device *ndev = hv_get_drvdata(device); |
bc304dd3 | 612 | struct vmbus_channel *channel = device->channel; |
bc304dd3 SH |
613 | u16 q_idx = 0; |
614 | int queue_sends; | |
615 | ||
616 | /* Notify the layer above us */ | |
617 | if (likely(skb)) { | |
793e3955 | 618 | const struct hv_netvsc_packet *packet |
bc304dd3 | 619 | = (struct hv_netvsc_packet *)skb->cb; |
793e3955 | 620 | u32 send_index = packet->send_buf_index; |
621 | struct netvsc_stats *tx_stats; | |
bc304dd3 SH |
622 | |
623 | if (send_index != NETVSC_INVALID_INDEX) | |
624 | netvsc_free_send_slot(net_device, send_index); | |
793e3955 | 625 | q_idx = packet->q_idx; |
bc304dd3 SH |
626 | channel = incoming_channel; |
627 | ||
6c80f3fc | 628 | tx_stats = &net_device->chan_table[q_idx].tx_stats; |
793e3955 | 629 | |
630 | u64_stats_update_begin(&tx_stats->syncp); | |
631 | tx_stats->packets += packet->total_packets; | |
632 | tx_stats->bytes += packet->total_bytes; | |
633 | u64_stats_update_end(&tx_stats->syncp); | |
634 | ||
f9645430 | 635 | napi_consume_skb(skb, budget); |
bc304dd3 SH |
636 | } |
637 | ||
b8b835a8 | 638 | queue_sends = |
639 | atomic_dec_return(&net_device->chan_table[q_idx].queue_sends); | |
bc304dd3 | 640 | |
46b4f7f5 | 641 | if (net_device->destroy && queue_sends == 0) |
bc304dd3 SH |
642 | wake_up(&net_device->wait_drain); |
643 | ||
644 | if (netif_tx_queue_stopped(netdev_get_tx_queue(ndev, q_idx)) && | |
bc304dd3 SH |
645 | (hv_ringbuf_avail_percent(&channel->outbound) > RING_AVAIL_PERCENT_HIWATER || |
646 | queue_sends < 1)) | |
647 | netif_tx_wake_queue(netdev_get_tx_queue(ndev, q_idx)); | |
648 | } | |
649 | ||
97c1723a | 650 | static void netvsc_send_completion(struct netvsc_device *net_device, |
25b85ee8 | 651 | struct vmbus_channel *incoming_channel, |
97c1723a | 652 | struct hv_device *device, |
f9645430 | 653 | const struct vmpacket_descriptor *desc, |
654 | int budget) | |
fceaf24a | 655 | { |
f3dd3f47 | 656 | struct nvsp_message *nvsp_packet = hv_pkt_data(desc); |
3d541ac5 | 657 | struct net_device *ndev = hv_get_drvdata(device); |
fceaf24a | 658 | |
bc304dd3 SH |
659 | switch (nvsp_packet->hdr.msg_type) { |
660 | case NVSP_MSG_TYPE_INIT_COMPLETE: | |
661 | case NVSP_MSG1_TYPE_SEND_RECV_BUF_COMPLETE: | |
662 | case NVSP_MSG1_TYPE_SEND_SEND_BUF_COMPLETE: | |
663 | case NVSP_MSG5_TYPE_SUBCHANNEL: | |
454f18a9 | 664 | /* Copy the response back */ |
53d21fdb | 665 | memcpy(&net_device->channel_init_pkt, nvsp_packet, |
21a80820 | 666 | sizeof(struct nvsp_message)); |
35abb21a | 667 | complete(&net_device->channel_init_wait); |
bc304dd3 SH |
668 | break; |
669 | ||
670 | case NVSP_MSG1_TYPE_SEND_RNDIS_PKT_COMPLETE: | |
671 | netvsc_send_tx_complete(net_device, incoming_channel, | |
f9645430 | 672 | device, desc, budget); |
bc304dd3 | 673 | break; |
fceaf24a | 674 | |
bc304dd3 SH |
675 | default: |
676 | netdev_err(ndev, | |
677 | "Unknown send completion type %d received!!\n", | |
678 | nvsp_packet->hdr.msg_type); | |
fceaf24a | 679 | } |
fceaf24a HJ |
680 | } |
681 | ||
c25aaf81 KS |
682 | static u32 netvsc_get_next_send_section(struct netvsc_device *net_device) |
683 | { | |
b58a1858 | 684 | unsigned long *map_addr = net_device->send_section_map; |
685 | unsigned int i; | |
686 | ||
fdfb70d2 | 687 | for_each_clear_bit(i, map_addr, net_device->send_section_cnt) { |
b58a1858 | 688 | if (sync_test_and_set_bit(i, map_addr) == 0) |
689 | return i; | |
c25aaf81 | 690 | } |
b58a1858 | 691 | |
692 | return NETVSC_INVALID_INDEX; | |
c25aaf81 KS |
693 | } |
694 | ||
da19fcd0 LP |
695 | static u32 netvsc_copy_to_send_buf(struct netvsc_device *net_device, |
696 | unsigned int section_index, | |
7c3877f2 | 697 | u32 pend_size, |
24476760 | 698 | struct hv_netvsc_packet *packet, |
a9f2e2d6 | 699 | struct rndis_message *rndis_msg, |
02b6de01 | 700 | struct hv_page_buffer *pb, |
694a9fb0 | 701 | struct sk_buff *skb) |
c25aaf81 KS |
702 | { |
703 | char *start = net_device->send_buf; | |
7c3877f2 HZ |
704 | char *dest = start + (section_index * net_device->send_section_size) |
705 | + pend_size; | |
c25aaf81 KS |
706 | int i; |
707 | u32 msg_size = 0; | |
7c3877f2 HZ |
708 | u32 padding = 0; |
709 | u32 remain = packet->total_data_buflen % net_device->pkt_align; | |
aa0a34be HZ |
710 | u32 page_count = packet->cp_partial ? packet->rmsg_pgcnt : |
711 | packet->page_buf_cnt; | |
7c3877f2 HZ |
712 | |
713 | /* Add padding */ | |
ebc1dcf6 | 714 | if (skb->xmit_more && remain && !packet->cp_partial) { |
7c3877f2 | 715 | padding = net_device->pkt_align - remain; |
24476760 | 716 | rndis_msg->msg_len += padding; |
7c3877f2 HZ |
717 | packet->total_data_buflen += padding; |
718 | } | |
c25aaf81 | 719 | |
aa0a34be | 720 | for (i = 0; i < page_count; i++) { |
02b6de01 | 721 | char *src = phys_to_virt(pb[i].pfn << PAGE_SHIFT); |
722 | u32 offset = pb[i].offset; | |
723 | u32 len = pb[i].len; | |
c25aaf81 KS |
724 | |
725 | memcpy(dest, (src + offset), len); | |
726 | msg_size += len; | |
727 | dest += len; | |
728 | } | |
7c3877f2 HZ |
729 | |
730 | if (padding) { | |
731 | memset(dest, 0, padding); | |
732 | msg_size += padding; | |
733 | } | |
734 | ||
c25aaf81 KS |
735 | return msg_size; |
736 | } | |
737 | ||
3a8963ac | 738 | static inline int netvsc_send_pkt( |
0a1275ca | 739 | struct hv_device *device, |
7c3877f2 | 740 | struct hv_netvsc_packet *packet, |
a9f2e2d6 | 741 | struct netvsc_device *net_device, |
02b6de01 | 742 | struct hv_page_buffer *pb, |
3a3d9a0a | 743 | struct sk_buff *skb) |
fceaf24a | 744 | { |
7c3877f2 | 745 | struct nvsp_message nvmsg; |
956a25c9 JP |
746 | struct nvsp_1_message_send_rndis_packet * const rpkt = |
747 | &nvmsg.msg.v1_msg.send_rndis_pkt; | |
748 | struct netvsc_channel * const nvchan = | |
749 | &net_device->chan_table[packet->q_idx]; | |
b8b835a8 | 750 | struct vmbus_channel *out_channel = nvchan->channel; |
0a1275ca | 751 | struct net_device *ndev = hv_get_drvdata(device); |
b8b835a8 | 752 | struct netdev_queue *txq = netdev_get_tx_queue(ndev, packet->q_idx); |
7c3877f2 HZ |
753 | u64 req_id; |
754 | int ret; | |
82fa3c77 | 755 | u32 ring_avail = hv_ringbuf_avail_percent(&out_channel->outbound); |
c25aaf81 | 756 | |
7c3877f2 | 757 | nvmsg.hdr.msg_type = NVSP_MSG1_TYPE_SEND_RNDIS_PKT; |
956a25c9 JP |
758 | if (skb) |
759 | rpkt->channel_type = 0; /* 0 is RMC_DATA */ | |
760 | else | |
761 | rpkt->channel_type = 1; /* 1 is RMC_CONTROL */ | |
fceaf24a | 762 | |
956a25c9 | 763 | rpkt->send_buf_section_index = packet->send_buf_index; |
7c3877f2 | 764 | if (packet->send_buf_index == NETVSC_INVALID_INDEX) |
956a25c9 | 765 | rpkt->send_buf_section_size = 0; |
7c3877f2 | 766 | else |
956a25c9 | 767 | rpkt->send_buf_section_size = packet->total_data_buflen; |
21a80820 | 768 | |
3a3d9a0a | 769 | req_id = (ulong)skb; |
f1ea3cd7 | 770 | |
c3582a2c HZ |
771 | if (out_channel->rescind) |
772 | return -ENODEV; | |
773 | ||
72a2f5bd | 774 | if (packet->page_buf_cnt) { |
02b6de01 | 775 | if (packet->cp_partial) |
776 | pb += packet->rmsg_pgcnt; | |
777 | ||
5a668d8c | 778 | ret = vmbus_sendpacket_pagebuffer(out_channel, |
779 | pb, packet->page_buf_cnt, | |
780 | &nvmsg, sizeof(nvmsg), | |
781 | req_id); | |
21a80820 | 782 | } else { |
5dd0fb9b | 783 | ret = vmbus_sendpacket(out_channel, |
784 | &nvmsg, sizeof(nvmsg), | |
785 | req_id, VM_PKT_DATA_INBAND, | |
786 | VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED); | |
fceaf24a HJ |
787 | } |
788 | ||
1d06825b | 789 | if (ret == 0) { |
b8b835a8 | 790 | atomic_inc_return(&nvchan->queue_sends); |
5b54dac8 | 791 | |
46b4f7f5 | 792 | if (ring_avail < RING_AVAIL_PERCENT_LOWATER) |
b8b835a8 | 793 | netif_tx_stop_queue(txq); |
1d06825b | 794 | } else if (ret == -EAGAIN) { |
b8b835a8 | 795 | netif_tx_stop_queue(txq); |
796 | if (atomic_read(&nvchan->queue_sends) < 1) { | |
797 | netif_tx_wake_queue(txq); | |
33be96e4 HZ |
798 | ret = -ENOSPC; |
799 | } | |
1d06825b | 800 | } else { |
4a2176c6 | 801 | netdev_err(ndev, |
802 | "Unable to send packet pages %u len %u, ret %d\n", | |
803 | packet->page_buf_cnt, packet->total_data_buflen, | |
804 | ret); | |
1d06825b | 805 | } |
fceaf24a | 806 | |
7c3877f2 HZ |
807 | return ret; |
808 | } | |
809 | ||
c85e4924 HZ |
810 | /* Move packet out of multi send data (msd), and clear msd */ |
811 | static inline void move_pkt_msd(struct hv_netvsc_packet **msd_send, | |
812 | struct sk_buff **msd_skb, | |
813 | struct multi_send_data *msdp) | |
814 | { | |
815 | *msd_skb = msdp->skb; | |
816 | *msd_send = msdp->pkt; | |
817 | msdp->skb = NULL; | |
818 | msdp->pkt = NULL; | |
819 | msdp->count = 0; | |
820 | } | |
821 | ||
2a926f79 | 822 | /* RCU already held by caller */ |
823 | int netvsc_send(struct net_device_context *ndev_ctx, | |
24476760 | 824 | struct hv_netvsc_packet *packet, |
a9f2e2d6 | 825 | struct rndis_message *rndis_msg, |
02b6de01 | 826 | struct hv_page_buffer *pb, |
3a3d9a0a | 827 | struct sk_buff *skb) |
7c3877f2 | 828 | { |
3962981f | 829 | struct netvsc_device *net_device |
867047c4 | 830 | = rcu_dereference_bh(ndev_ctx->nvdev); |
2a926f79 | 831 | struct hv_device *device = ndev_ctx->device_ctx; |
6c4c137e | 832 | int ret = 0; |
b8b835a8 | 833 | struct netvsc_channel *nvchan; |
7c3877f2 HZ |
834 | u32 pktlen = packet->total_data_buflen, msd_len = 0; |
835 | unsigned int section_index = NETVSC_INVALID_INDEX; | |
7c3877f2 HZ |
836 | struct multi_send_data *msdp; |
837 | struct hv_netvsc_packet *msd_send = NULL, *cur_send = NULL; | |
c85e4924 | 838 | struct sk_buff *msd_skb = NULL; |
aa0a34be | 839 | bool try_batch; |
bde79be5 | 840 | bool xmit_more = (skb != NULL) ? skb->xmit_more : false; |
7c3877f2 | 841 | |
592b4fe8 | 842 | /* If device is rescinded, return error and packet will get dropped. */ |
2a926f79 | 843 | if (unlikely(!net_device || net_device->destroy)) |
7c3877f2 HZ |
844 | return -ENODEV; |
845 | ||
e8f0a89c VK |
846 | /* We may race with netvsc_connect_vsp()/netvsc_init_buf() and get |
847 | * here before the negotiation with the host is finished and | |
848 | * send_section_map may not be allocated yet. | |
849 | */ | |
2d694d2a | 850 | if (unlikely(!net_device->send_section_map)) |
e8f0a89c VK |
851 | return -EAGAIN; |
852 | ||
b8b835a8 | 853 | nvchan = &net_device->chan_table[packet->q_idx]; |
7c3877f2 | 854 | packet->send_buf_index = NETVSC_INVALID_INDEX; |
aa0a34be | 855 | packet->cp_partial = false; |
7c3877f2 | 856 | |
cf8190e4 HZ |
857 | /* Send control message directly without accessing msd (Multi-Send |
858 | * Data) field which may be changed during data packet processing. | |
859 | */ | |
860 | if (!skb) { | |
861 | cur_send = packet; | |
862 | goto send_now; | |
863 | } | |
864 | ||
7c3877f2 | 865 | /* batch packets in send buffer if possible */ |
b8b835a8 | 866 | msdp = &nvchan->msd; |
7c3877f2 HZ |
867 | if (msdp->pkt) |
868 | msd_len = msdp->pkt->total_data_buflen; | |
869 | ||
ebc1dcf6 | 870 | try_batch = msd_len > 0 && msdp->count < net_device->max_pkt; |
aa0a34be | 871 | if (try_batch && msd_len + pktlen + net_device->pkt_align < |
7c3877f2 HZ |
872 | net_device->send_section_size) { |
873 | section_index = msdp->pkt->send_buf_index; | |
874 | ||
aa0a34be HZ |
875 | } else if (try_batch && msd_len + packet->rmsg_size < |
876 | net_device->send_section_size) { | |
877 | section_index = msdp->pkt->send_buf_index; | |
878 | packet->cp_partial = true; | |
879 | ||
ebc1dcf6 | 880 | } else if (pktlen + net_device->pkt_align < |
7c3877f2 HZ |
881 | net_device->send_section_size) { |
882 | section_index = netvsc_get_next_send_section(net_device); | |
cad5c197 | 883 | if (unlikely(section_index == NETVSC_INVALID_INDEX)) { |
884 | ++ndev_ctx->eth_stats.tx_send_full; | |
885 | } else { | |
c85e4924 HZ |
886 | move_pkt_msd(&msd_send, &msd_skb, msdp); |
887 | msd_len = 0; | |
7c3877f2 HZ |
888 | } |
889 | } | |
890 | ||
891 | if (section_index != NETVSC_INVALID_INDEX) { | |
892 | netvsc_copy_to_send_buf(net_device, | |
893 | section_index, msd_len, | |
694a9fb0 | 894 | packet, rndis_msg, pb, skb); |
b08cc791 | 895 | |
7c3877f2 | 896 | packet->send_buf_index = section_index; |
aa0a34be HZ |
897 | |
898 | if (packet->cp_partial) { | |
899 | packet->page_buf_cnt -= packet->rmsg_pgcnt; | |
900 | packet->total_data_buflen = msd_len + packet->rmsg_size; | |
901 | } else { | |
902 | packet->page_buf_cnt = 0; | |
903 | packet->total_data_buflen += msd_len; | |
aa0a34be | 904 | } |
7c3877f2 | 905 | |
793e3955 | 906 | if (msdp->pkt) { |
907 | packet->total_packets += msdp->pkt->total_packets; | |
908 | packet->total_bytes += msdp->pkt->total_bytes; | |
909 | } | |
910 | ||
c85e4924 | 911 | if (msdp->skb) |
17db4bce | 912 | dev_consume_skb_any(msdp->skb); |
ee90b812 | 913 | |
bde79be5 | 914 | if (xmit_more && !packet->cp_partial) { |
c85e4924 | 915 | msdp->skb = skb; |
7c3877f2 HZ |
916 | msdp->pkt = packet; |
917 | msdp->count++; | |
918 | } else { | |
919 | cur_send = packet; | |
c85e4924 | 920 | msdp->skb = NULL; |
7c3877f2 HZ |
921 | msdp->pkt = NULL; |
922 | msdp->count = 0; | |
923 | } | |
924 | } else { | |
c85e4924 | 925 | move_pkt_msd(&msd_send, &msd_skb, msdp); |
7c3877f2 HZ |
926 | cur_send = packet; |
927 | } | |
928 | ||
7c3877f2 | 929 | if (msd_send) { |
6c4c137e SH |
930 | int m_ret = netvsc_send_pkt(device, msd_send, net_device, |
931 | NULL, msd_skb); | |
7c3877f2 HZ |
932 | |
933 | if (m_ret != 0) { | |
934 | netvsc_free_send_slot(net_device, | |
935 | msd_send->send_buf_index); | |
c85e4924 | 936 | dev_kfree_skb_any(msd_skb); |
7c3877f2 HZ |
937 | } |
938 | } | |
939 | ||
cf8190e4 | 940 | send_now: |
7c3877f2 | 941 | if (cur_send) |
0a1275ca | 942 | ret = netvsc_send_pkt(device, cur_send, net_device, pb, skb); |
7c3877f2 | 943 | |
7aab5159 JS |
944 | if (ret != 0 && section_index != NETVSC_INVALID_INDEX) |
945 | netvsc_free_send_slot(net_device, section_index); | |
d953ca4d | 946 | |
fceaf24a HJ |
947 | return ret; |
948 | } | |
949 | ||
7426b1a5 | 950 | /* Send pending recv completions */ |
cad5c197 | 951 | static int send_recv_completions(struct net_device *ndev, |
952 | struct netvsc_device *nvdev, | |
953 | struct netvsc_channel *nvchan) | |
5fa9d3c5 | 954 | { |
7426b1a5 | 955 | struct multi_recv_comp *mrc = &nvchan->mrc; |
956 | struct recv_comp_msg { | |
957 | struct nvsp_message_header hdr; | |
958 | u32 status; | |
959 | } __packed; | |
960 | struct recv_comp_msg msg = { | |
961 | .hdr.msg_type = NVSP_MSG1_TYPE_SEND_RNDIS_PKT_COMPLETE, | |
962 | }; | |
5fa9d3c5 HZ |
963 | int ret; |
964 | ||
7426b1a5 | 965 | while (mrc->first != mrc->next) { |
966 | const struct recv_comp_data *rcd | |
967 | = mrc->slots + mrc->first; | |
c0b558e5 | 968 | |
7426b1a5 | 969 | msg.status = rcd->status; |
970 | ret = vmbus_sendpacket(nvchan->channel, &msg, sizeof(msg), | |
971 | rcd->tid, VM_PKT_COMP, 0); | |
cad5c197 | 972 | if (unlikely(ret)) { |
973 | struct net_device_context *ndev_ctx = netdev_priv(ndev); | |
974 | ||
975 | ++ndev_ctx->eth_stats.rx_comp_busy; | |
7426b1a5 | 976 | return ret; |
cad5c197 | 977 | } |
c0b558e5 | 978 | |
7426b1a5 | 979 | if (++mrc->first == nvdev->recv_completion_cnt) |
980 | mrc->first = 0; | |
981 | } | |
c0b558e5 | 982 | |
7426b1a5 | 983 | /* receive completion ring has been emptied */ |
984 | if (unlikely(nvdev->destroy)) | |
985 | wake_up(&nvdev->wait_drain); | |
c0b558e5 | 986 | |
7426b1a5 | 987 | return 0; |
c0b558e5 HZ |
988 | } |
989 | ||
7426b1a5 | 990 | /* Count how many receive completions are outstanding */ |
991 | static void recv_comp_slot_avail(const struct netvsc_device *nvdev, | |
992 | const struct multi_recv_comp *mrc, | |
993 | u32 *filled, u32 *avail) | |
c0b558e5 | 994 | { |
7426b1a5 | 995 | u32 count = nvdev->recv_completion_cnt; |
c0b558e5 | 996 | |
7426b1a5 | 997 | if (mrc->next >= mrc->first) |
998 | *filled = mrc->next - mrc->first; | |
999 | else | |
1000 | *filled = (count - mrc->first) + mrc->next; | |
c0b558e5 | 1001 | |
7426b1a5 | 1002 | *avail = count - *filled - 1; |
c0b558e5 HZ |
1003 | } |
1004 | ||
7426b1a5 | 1005 | /* Add receive complete to ring to send to host. */ |
1006 | static void enq_receive_complete(struct net_device *ndev, | |
1007 | struct netvsc_device *nvdev, u16 q_idx, | |
1008 | u64 tid, u32 status) | |
c0b558e5 | 1009 | { |
7426b1a5 | 1010 | struct netvsc_channel *nvchan = &nvdev->chan_table[q_idx]; |
1011 | struct multi_recv_comp *mrc = &nvchan->mrc; | |
c0b558e5 | 1012 | struct recv_comp_data *rcd; |
7426b1a5 | 1013 | u32 filled, avail; |
c0b558e5 | 1014 | |
7426b1a5 | 1015 | recv_comp_slot_avail(nvdev, mrc, &filled, &avail); |
c0b558e5 | 1016 | |
7426b1a5 | 1017 | if (unlikely(filled > NAPI_POLL_WEIGHT)) { |
cad5c197 | 1018 | send_recv_completions(ndev, nvdev, nvchan); |
7426b1a5 | 1019 | recv_comp_slot_avail(nvdev, mrc, &filled, &avail); |
5fa9d3c5 | 1020 | } |
c0b558e5 | 1021 | |
7426b1a5 | 1022 | if (unlikely(!avail)) { |
1023 | netdev_err(ndev, "Recv_comp full buf q:%hd, tid:%llx\n", | |
1024 | q_idx, tid); | |
1025 | return; | |
1026 | } | |
c0b558e5 | 1027 | |
7426b1a5 | 1028 | rcd = mrc->slots + mrc->next; |
1029 | rcd->tid = tid; | |
1030 | rcd->status = status; | |
c0b558e5 | 1031 | |
7426b1a5 | 1032 | if (++mrc->next == nvdev->recv_completion_cnt) |
1033 | mrc->next = 0; | |
c0b558e5 HZ |
1034 | } |
1035 | ||
15a863bf | 1036 | static int netvsc_receive(struct net_device *ndev, |
7426b1a5 | 1037 | struct netvsc_device *net_device, |
1038 | struct net_device_context *net_device_ctx, | |
1039 | struct hv_device *device, | |
1040 | struct vmbus_channel *channel, | |
1041 | const struct vmpacket_descriptor *desc, | |
1042 | struct nvsp_message *nvsp) | |
fceaf24a | 1043 | { |
f3dd3f47 | 1044 | const struct vmtransfer_page_packet_header *vmxferpage_packet |
1045 | = container_of(desc, const struct vmtransfer_page_packet_header, d); | |
15a863bf | 1046 | u16 q_idx = channel->offermsg.offer.sub_channel_index; |
dc54a08c | 1047 | char *recv_buf = net_device->recv_buf; |
4baab261 | 1048 | u32 status = NVSP_STAT_SUCCESS; |
45326342 HZ |
1049 | int i; |
1050 | int count = 0; | |
779b4d17 | 1051 | |
454f18a9 | 1052 | /* Make sure this is a valid nvsp packet */ |
dc54a08c | 1053 | if (unlikely(nvsp->hdr.msg_type != NVSP_MSG1_TYPE_SEND_RNDIS_PKT)) { |
1054 | netif_err(net_device_ctx, rx_err, ndev, | |
1055 | "Unknown nvsp packet type received %u\n", | |
1056 | nvsp->hdr.msg_type); | |
15a863bf | 1057 | return 0; |
fceaf24a HJ |
1058 | } |
1059 | ||
dc54a08c | 1060 | if (unlikely(vmxferpage_packet->xfer_pageset_id != NETVSC_RECEIVE_BUFFER_ID)) { |
1061 | netif_err(net_device_ctx, rx_err, ndev, | |
1062 | "Invalid xfer page set id - expecting %x got %x\n", | |
1063 | NETVSC_RECEIVE_BUFFER_ID, | |
1064 | vmxferpage_packet->xfer_pageset_id); | |
15a863bf | 1065 | return 0; |
fceaf24a HJ |
1066 | } |
1067 | ||
4baab261 | 1068 | count = vmxferpage_packet->range_cnt; |
fceaf24a | 1069 | |
454f18a9 | 1070 | /* Each range represents 1 RNDIS pkt that contains 1 ethernet frame */ |
4baab261 | 1071 | for (i = 0; i < count; i++) { |
dc54a08c | 1072 | void *data = recv_buf |
1073 | + vmxferpage_packet->ranges[i].byte_offset; | |
1074 | u32 buflen = vmxferpage_packet->ranges[i].byte_count; | |
fceaf24a | 1075 | |
454f18a9 | 1076 | /* Pass it to the upper layer */ |
dc54a08c | 1077 | status = rndis_filter_receive(ndev, net_device, device, |
1078 | channel, data, buflen); | |
fceaf24a HJ |
1079 | } |
1080 | ||
7426b1a5 | 1081 | enq_receive_complete(ndev, net_device, q_idx, |
1082 | vmxferpage_packet->d.trans_id, status); | |
15a863bf | 1083 | |
15a863bf | 1084 | return count; |
fceaf24a HJ |
1085 | } |
1086 | ||
5b54dac8 | 1087 | static void netvsc_send_table(struct hv_device *hdev, |
71790a27 | 1088 | struct nvsp_message *nvmsg) |
5b54dac8 | 1089 | { |
0a1275ca | 1090 | struct net_device *ndev = hv_get_drvdata(hdev); |
7ce10124 | 1091 | struct net_device_context *net_device_ctx = netdev_priv(ndev); |
5b54dac8 HZ |
1092 | int i; |
1093 | u32 count, *tab; | |
1094 | ||
5b54dac8 HZ |
1095 | count = nvmsg->msg.v5_msg.send_table.count; |
1096 | if (count != VRSS_SEND_TAB_SIZE) { | |
1097 | netdev_err(ndev, "Received wrong send-table size:%u\n", count); | |
1098 | return; | |
1099 | } | |
1100 | ||
1101 | tab = (u32 *)((unsigned long)&nvmsg->msg.v5_msg.send_table + | |
1102 | nvmsg->msg.v5_msg.send_table.offset); | |
1103 | ||
1104 | for (i = 0; i < count; i++) | |
7ce10124 | 1105 | net_device_ctx->tx_send_table[i] = tab[i]; |
5b54dac8 HZ |
1106 | } |
1107 | ||
f9a7da91 | 1108 | static void netvsc_send_vf(struct net_device_context *net_device_ctx, |
71790a27 HZ |
1109 | struct nvsp_message *nvmsg) |
1110 | { | |
f9a7da91 VK |
1111 | net_device_ctx->vf_alloc = nvmsg->msg.v4_msg.vf_assoc.allocated; |
1112 | net_device_ctx->vf_serial = nvmsg->msg.v4_msg.vf_assoc.serial; | |
71790a27 HZ |
1113 | } |
1114 | ||
1115 | static inline void netvsc_receive_inband(struct hv_device *hdev, | |
f9a7da91 VK |
1116 | struct net_device_context *net_device_ctx, |
1117 | struct nvsp_message *nvmsg) | |
71790a27 HZ |
1118 | { |
1119 | switch (nvmsg->hdr.msg_type) { | |
1120 | case NVSP_MSG5_TYPE_SEND_INDIRECTION_TABLE: | |
1121 | netvsc_send_table(hdev, nvmsg); | |
1122 | break; | |
1123 | ||
1124 | case NVSP_MSG4_TYPE_SEND_VF_ASSOCIATION: | |
f9a7da91 | 1125 | netvsc_send_vf(net_device_ctx, nvmsg); |
71790a27 HZ |
1126 | break; |
1127 | } | |
1128 | } | |
1129 | ||
15a863bf | 1130 | static int netvsc_process_raw_pkt(struct hv_device *device, |
1131 | struct vmbus_channel *channel, | |
1132 | struct netvsc_device *net_device, | |
1133 | struct net_device *ndev, | |
f9645430 | 1134 | const struct vmpacket_descriptor *desc, |
1135 | int budget) | |
99a50bb1 | 1136 | { |
f9a7da91 | 1137 | struct net_device_context *net_device_ctx = netdev_priv(ndev); |
f3dd3f47 | 1138 | struct nvsp_message *nvmsg = hv_pkt_data(desc); |
99a50bb1 S |
1139 | |
1140 | switch (desc->type) { | |
1141 | case VM_PKT_COMP: | |
f9645430 | 1142 | netvsc_send_completion(net_device, channel, device, |
1143 | desc, budget); | |
99a50bb1 S |
1144 | break; |
1145 | ||
1146 | case VM_PKT_DATA_USING_XFER_PAGES: | |
15a863bf | 1147 | return netvsc_receive(ndev, net_device, net_device_ctx, |
1148 | device, channel, desc, nvmsg); | |
99a50bb1 S |
1149 | break; |
1150 | ||
1151 | case VM_PKT_DATA_INBAND: | |
f9a7da91 | 1152 | netvsc_receive_inband(device, net_device_ctx, nvmsg); |
99a50bb1 S |
1153 | break; |
1154 | ||
1155 | default: | |
1156 | netdev_err(ndev, "unhandled packet type %d, tid %llx\n", | |
f4f1c23d | 1157 | desc->type, desc->trans_id); |
99a50bb1 S |
1158 | break; |
1159 | } | |
15a863bf | 1160 | |
1161 | return 0; | |
1162 | } | |
1163 | ||
1164 | static struct hv_device *netvsc_channel_to_device(struct vmbus_channel *channel) | |
1165 | { | |
1166 | struct vmbus_channel *primary = channel->primary_channel; | |
1167 | ||
1168 | return primary ? primary->device_obj : channel->device_obj; | |
1169 | } | |
1170 | ||
262b7f14 | 1171 | /* Network processing softirq |
1172 | * Process data in incoming ring buffer from host | |
1173 | * Stops when ring is empty or budget is met or exceeded. | |
1174 | */ | |
15a863bf | 1175 | int netvsc_poll(struct napi_struct *napi, int budget) |
1176 | { | |
1177 | struct netvsc_channel *nvchan | |
1178 | = container_of(napi, struct netvsc_channel, napi); | |
35fbbccf | 1179 | struct netvsc_device *net_device = nvchan->net_device; |
15a863bf | 1180 | struct vmbus_channel *channel = nvchan->channel; |
1181 | struct hv_device *device = netvsc_channel_to_device(channel); | |
15a863bf | 1182 | struct net_device *ndev = hv_get_drvdata(device); |
15a863bf | 1183 | int work_done = 0; |
1184 | ||
f4f1c23d | 1185 | /* If starting a new interval */ |
1186 | if (!nvchan->desc) | |
1187 | nvchan->desc = hv_pkt_iter_first(channel); | |
15a863bf | 1188 | |
f4f1c23d | 1189 | while (nvchan->desc && work_done < budget) { |
1190 | work_done += netvsc_process_raw_pkt(device, channel, net_device, | |
f9645430 | 1191 | ndev, nvchan->desc, budget); |
f4f1c23d | 1192 | nvchan->desc = hv_pkt_iter_next(channel, nvchan->desc); |
15a863bf | 1193 | } |
15a863bf | 1194 | |
f4e40363 | 1195 | /* If send of pending receive completions suceeded |
1196 | * and did not exhaust NAPI budget this time | |
7426b1a5 | 1197 | * and not doing busy poll |
f4e40363 | 1198 | * then re-enable host interrupts |
1199 | * and reschedule if ring is not empty. | |
262b7f14 | 1200 | */ |
cad5c197 | 1201 | if (send_recv_completions(ndev, net_device, nvchan) == 0 && |
7426b1a5 | 1202 | work_done < budget && |
15a863bf | 1203 | napi_complete_done(napi, work_done) && |
7426b1a5 | 1204 | hv_end_read(&channel->inbound)) { |
1205 | hv_begin_read(&channel->inbound); | |
15a863bf | 1206 | napi_reschedule(napi); |
7426b1a5 | 1207 | } |
f4f1c23d | 1208 | |
1209 | /* Driver may overshoot since multiple packets per descriptor */ | |
1210 | return min(work_done, budget); | |
99a50bb1 S |
1211 | } |
1212 | ||
262b7f14 | 1213 | /* Call back when data is available in host ring buffer. |
1214 | * Processing is deferred until network softirq (NAPI) | |
1215 | */ | |
5b54dac8 | 1216 | void netvsc_channel_cb(void *context) |
fceaf24a | 1217 | { |
6de38af6 | 1218 | struct netvsc_channel *nvchan = context; |
43bf99ce | 1219 | struct vmbus_channel *channel = nvchan->channel; |
1220 | struct hv_ring_buffer_info *rbi = &channel->inbound; | |
1221 | ||
1222 | /* preload first vmpacket descriptor */ | |
1223 | prefetch(hv_get_ring_buffer(rbi) + rbi->priv_read_index); | |
0b307ebd | 1224 | |
f4f1c23d | 1225 | if (napi_schedule_prep(&nvchan->napi)) { |
1226 | /* disable interupts from host */ | |
43bf99ce | 1227 | hv_begin_read(rbi); |
0d6dd357 | 1228 | |
f4f1c23d | 1229 | __napi_schedule(&nvchan->napi); |
1230 | } | |
fceaf24a | 1231 | } |
af24ce42 | 1232 | |
b637e023 HZ |
1233 | /* |
1234 | * netvsc_device_add - Callback when the device belonging to this | |
1235 | * driver is added | |
1236 | */ | |
9749fed5 | 1237 | struct netvsc_device *netvsc_device_add(struct hv_device *device, |
1238 | const struct netvsc_device_info *device_info) | |
b637e023 | 1239 | { |
88098834 | 1240 | int i, ret = 0; |
2c7f83ca | 1241 | int ring_size = device_info->ring_size; |
b637e023 | 1242 | struct netvsc_device *net_device; |
88098834 VK |
1243 | struct net_device *ndev = hv_get_drvdata(device); |
1244 | struct net_device_context *net_device_ctx = netdev_priv(ndev); | |
b637e023 | 1245 | |
88098834 | 1246 | net_device = alloc_net_device(); |
b1c84927 | 1247 | if (!net_device) |
9749fed5 | 1248 | return ERR_PTR(-ENOMEM); |
b637e023 | 1249 | |
5b54dac8 HZ |
1250 | net_device->ring_size = ring_size; |
1251 | ||
15a863bf | 1252 | /* Because the device uses NAPI, all the interrupt batching and |
1253 | * control is done via Net softirq, not the channel handling | |
1254 | */ | |
1255 | set_channel_read_mode(device->channel, HV_CALL_ISR); | |
1256 | ||
bffb1842 S |
1257 | /* If we're reopening the device we may have multiple queues, fill the |
1258 | * chn_table with the default channel to use it before subchannels are | |
1259 | * opened. | |
1260 | * Initialize the channel state before we open; | |
1261 | * we can be interrupted as soon as we open the channel. | |
1262 | */ | |
1263 | ||
1264 | for (i = 0; i < VRSS_CHANNEL_MAX; i++) { | |
1265 | struct netvsc_channel *nvchan = &net_device->chan_table[i]; | |
1266 | ||
1267 | nvchan->channel = device->channel; | |
35fbbccf | 1268 | nvchan->net_device = net_device; |
4a0dee1f FF |
1269 | u64_stats_init(&nvchan->tx_stats.syncp); |
1270 | u64_stats_init(&nvchan->rx_stats.syncp); | |
bffb1842 S |
1271 | } |
1272 | ||
2be0f264 | 1273 | /* Enable NAPI handler before init callbacks */ |
1274 | netif_napi_add(ndev, &net_device->chan_table[0].napi, | |
1275 | netvsc_poll, NAPI_POLL_WEIGHT); | |
1276 | ||
b637e023 | 1277 | /* Open the channel */ |
aae23986 S |
1278 | ret = vmbus_open(device->channel, ring_size * PAGE_SIZE, |
1279 | ring_size * PAGE_SIZE, NULL, 0, | |
6de38af6 | 1280 | netvsc_channel_cb, |
1281 | net_device->chan_table); | |
b637e023 HZ |
1282 | |
1283 | if (ret != 0) { | |
2be0f264 | 1284 | netif_napi_del(&net_device->chan_table[0].napi); |
d9871158 | 1285 | netdev_err(ndev, "unable to open channel: %d\n", ret); |
b637e023 HZ |
1286 | goto cleanup; |
1287 | } | |
1288 | ||
1289 | /* Channel is opened */ | |
93ba2222 | 1290 | netdev_dbg(ndev, "hv_netvsc channel opened successfully\n"); |
b637e023 | 1291 | |
15a863bf | 1292 | napi_enable(&net_device->chan_table[0].napi); |
88098834 VK |
1293 | |
1294 | /* Writing nvdev pointer unlocks netvsc_send(), make sure chn_table is | |
1295 | * populated. | |
1296 | */ | |
545a8e79 | 1297 | rcu_assign_pointer(net_device_ctx->nvdev, net_device); |
5b54dac8 | 1298 | |
b637e023 | 1299 | /* Connect with the NetVsp */ |
8b532797 | 1300 | ret = netvsc_connect_vsp(device, net_device, device_info); |
b637e023 | 1301 | if (ret != 0) { |
d9871158 | 1302 | netdev_err(ndev, |
c909ebbd | 1303 | "unable to connect to NetVSP - %d\n", ret); |
b637e023 HZ |
1304 | goto close; |
1305 | } | |
1306 | ||
9749fed5 | 1307 | return net_device; |
b637e023 HZ |
1308 | |
1309 | close: | |
49393347 | 1310 | RCU_INIT_POINTER(net_device_ctx->nvdev, NULL); |
1311 | napi_disable(&net_device->chan_table[0].napi); | |
15a863bf | 1312 | |
b637e023 HZ |
1313 | /* Now, we can close the channel safely */ |
1314 | vmbus_close(device->channel); | |
1315 | ||
1316 | cleanup: | |
545a8e79 | 1317 | free_netvsc_device(&net_device->rcu); |
b637e023 | 1318 | |
9749fed5 | 1319 | return ERR_PTR(ret); |
b637e023 | 1320 | } |