]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blob - drivers/hv/channel_mgmt.c
Merge tag 'armsoc-drivers' of git://git.kernel.org/pub/scm/linux/kernel/git/arm/arm-soc
[mirror_ubuntu-bionic-kernel.git] / drivers / hv / channel_mgmt.c
1 /*
2 * Copyright (c) 2009, Microsoft Corporation.
3 *
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms and conditions of the GNU General Public License,
6 * version 2, as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope it will be useful, but WITHOUT
9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
11 * more details.
12 *
13 * You should have received a copy of the GNU General Public License along with
14 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
15 * Place - Suite 330, Boston, MA 02111-1307 USA.
16 *
17 * Authors:
18 * Haiyang Zhang <haiyangz@microsoft.com>
19 * Hank Janssen <hjanssen@microsoft.com>
20 */
21 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
22
23 #include <linux/kernel.h>
24 #include <linux/interrupt.h>
25 #include <linux/sched.h>
26 #include <linux/wait.h>
27 #include <linux/mm.h>
28 #include <linux/slab.h>
29 #include <linux/list.h>
30 #include <linux/module.h>
31 #include <linux/completion.h>
32 #include <linux/delay.h>
33 #include <linux/hyperv.h>
34
35 #include "hyperv_vmbus.h"
36
37 static void init_vp_index(struct vmbus_channel *channel, u16 dev_type);
38
39 static const struct vmbus_device vmbus_devs[] = {
40 /* IDE */
41 { .dev_type = HV_IDE,
42 HV_IDE_GUID,
43 .perf_device = true,
44 },
45
46 /* SCSI */
47 { .dev_type = HV_SCSI,
48 HV_SCSI_GUID,
49 .perf_device = true,
50 },
51
52 /* Fibre Channel */
53 { .dev_type = HV_FC,
54 HV_SYNTHFC_GUID,
55 .perf_device = true,
56 },
57
58 /* Synthetic NIC */
59 { .dev_type = HV_NIC,
60 HV_NIC_GUID,
61 .perf_device = true,
62 },
63
64 /* Network Direct */
65 { .dev_type = HV_ND,
66 HV_ND_GUID,
67 .perf_device = true,
68 },
69
70 /* PCIE */
71 { .dev_type = HV_PCIE,
72 HV_PCIE_GUID,
73 .perf_device = true,
74 },
75
76 /* Synthetic Frame Buffer */
77 { .dev_type = HV_FB,
78 HV_SYNTHVID_GUID,
79 .perf_device = false,
80 },
81
82 /* Synthetic Keyboard */
83 { .dev_type = HV_KBD,
84 HV_KBD_GUID,
85 .perf_device = false,
86 },
87
88 /* Synthetic MOUSE */
89 { .dev_type = HV_MOUSE,
90 HV_MOUSE_GUID,
91 .perf_device = false,
92 },
93
94 /* KVP */
95 { .dev_type = HV_KVP,
96 HV_KVP_GUID,
97 .perf_device = false,
98 },
99
100 /* Time Synch */
101 { .dev_type = HV_TS,
102 HV_TS_GUID,
103 .perf_device = false,
104 },
105
106 /* Heartbeat */
107 { .dev_type = HV_HB,
108 HV_HEART_BEAT_GUID,
109 .perf_device = false,
110 },
111
112 /* Shutdown */
113 { .dev_type = HV_SHUTDOWN,
114 HV_SHUTDOWN_GUID,
115 .perf_device = false,
116 },
117
118 /* File copy */
119 { .dev_type = HV_FCOPY,
120 HV_FCOPY_GUID,
121 .perf_device = false,
122 },
123
124 /* Backup */
125 { .dev_type = HV_BACKUP,
126 HV_VSS_GUID,
127 .perf_device = false,
128 },
129
130 /* Dynamic Memory */
131 { .dev_type = HV_DM,
132 HV_DM_GUID,
133 .perf_device = false,
134 },
135
136 /* Unknown GUID */
137 { .dev_type = HV_UNKNOWN,
138 .perf_device = false,
139 },
140 };
141
142 static const struct {
143 uuid_le guid;
144 } vmbus_unsupported_devs[] = {
145 { HV_AVMA1_GUID },
146 { HV_AVMA2_GUID },
147 { HV_RDV_GUID },
148 };
149
150 static bool is_unsupported_vmbus_devs(const uuid_le *guid)
151 {
152 int i;
153
154 for (i = 0; i < ARRAY_SIZE(vmbus_unsupported_devs); i++)
155 if (!uuid_le_cmp(*guid, vmbus_unsupported_devs[i].guid))
156 return true;
157 return false;
158 }
159
160 static u16 hv_get_dev_type(const struct vmbus_channel *channel)
161 {
162 const uuid_le *guid = &channel->offermsg.offer.if_type;
163 u16 i;
164
165 if (is_hvsock_channel(channel) || is_unsupported_vmbus_devs(guid))
166 return HV_UNKNOWN;
167
168 for (i = HV_IDE; i < HV_UNKNOWN; i++) {
169 if (!uuid_le_cmp(*guid, vmbus_devs[i].guid))
170 return i;
171 }
172 pr_info("Unknown GUID: %pUl\n", guid);
173 return i;
174 }
175
176 /**
177 * vmbus_prep_negotiate_resp() - Create default response for Hyper-V Negotiate message
178 * @icmsghdrp: Pointer to msg header structure
179 * @icmsg_negotiate: Pointer to negotiate message structure
180 * @buf: Raw buffer channel data
181 *
182 * @icmsghdrp is of type &struct icmsg_hdr.
183 * @negop is of type &struct icmsg_negotiate.
184 * Set up and fill in default negotiate response message.
185 *
186 * The fw_version specifies the framework version that
187 * we can support and srv_version specifies the service
188 * version we can support.
189 *
190 * Mainly used by Hyper-V drivers.
191 */
192 bool vmbus_prep_negotiate_resp(struct icmsg_hdr *icmsghdrp,
193 struct icmsg_negotiate *negop, u8 *buf,
194 int fw_version, int srv_version)
195 {
196 int icframe_major, icframe_minor;
197 int icmsg_major, icmsg_minor;
198 int fw_major, fw_minor;
199 int srv_major, srv_minor;
200 int i;
201 bool found_match = false;
202
203 icmsghdrp->icmsgsize = 0x10;
204 fw_major = (fw_version >> 16);
205 fw_minor = (fw_version & 0xFFFF);
206
207 srv_major = (srv_version >> 16);
208 srv_minor = (srv_version & 0xFFFF);
209
210 negop = (struct icmsg_negotiate *)&buf[
211 sizeof(struct vmbuspipe_hdr) +
212 sizeof(struct icmsg_hdr)];
213
214 icframe_major = negop->icframe_vercnt;
215 icframe_minor = 0;
216
217 icmsg_major = negop->icmsg_vercnt;
218 icmsg_minor = 0;
219
220 /*
221 * Select the framework version number we will
222 * support.
223 */
224
225 for (i = 0; i < negop->icframe_vercnt; i++) {
226 if ((negop->icversion_data[i].major == fw_major) &&
227 (negop->icversion_data[i].minor == fw_minor)) {
228 icframe_major = negop->icversion_data[i].major;
229 icframe_minor = negop->icversion_data[i].minor;
230 found_match = true;
231 }
232 }
233
234 if (!found_match)
235 goto fw_error;
236
237 found_match = false;
238
239 for (i = negop->icframe_vercnt;
240 (i < negop->icframe_vercnt + negop->icmsg_vercnt); i++) {
241 if ((negop->icversion_data[i].major == srv_major) &&
242 (negop->icversion_data[i].minor == srv_minor)) {
243 icmsg_major = negop->icversion_data[i].major;
244 icmsg_minor = negop->icversion_data[i].minor;
245 found_match = true;
246 }
247 }
248
249 /*
250 * Respond with the framework and service
251 * version numbers we can support.
252 */
253
254 fw_error:
255 if (!found_match) {
256 negop->icframe_vercnt = 0;
257 negop->icmsg_vercnt = 0;
258 } else {
259 negop->icframe_vercnt = 1;
260 negop->icmsg_vercnt = 1;
261 }
262
263 negop->icversion_data[0].major = icframe_major;
264 negop->icversion_data[0].minor = icframe_minor;
265 negop->icversion_data[1].major = icmsg_major;
266 negop->icversion_data[1].minor = icmsg_minor;
267 return found_match;
268 }
269
270 EXPORT_SYMBOL_GPL(vmbus_prep_negotiate_resp);
271
272 /*
273 * alloc_channel - Allocate and initialize a vmbus channel object
274 */
275 static struct vmbus_channel *alloc_channel(void)
276 {
277 struct vmbus_channel *channel;
278
279 channel = kzalloc(sizeof(*channel), GFP_ATOMIC);
280 if (!channel)
281 return NULL;
282
283 channel->acquire_ring_lock = true;
284 spin_lock_init(&channel->inbound_lock);
285 spin_lock_init(&channel->lock);
286
287 INIT_LIST_HEAD(&channel->sc_list);
288 INIT_LIST_HEAD(&channel->percpu_list);
289
290 return channel;
291 }
292
/*
 * free_channel - Release the memory of a vmbus channel object
 *
 * Only the object itself is freed (kfree); callers in this file unlink the
 * channel from its lists before calling this.
 */
static void free_channel(struct vmbus_channel *channel)
{
	kfree(channel);
}
300
301 static void percpu_channel_enq(void *arg)
302 {
303 struct vmbus_channel *channel = arg;
304 int cpu = smp_processor_id();
305
306 list_add_tail(&channel->percpu_list, &hv_context.percpu_list[cpu]);
307 }
308
309 static void percpu_channel_deq(void *arg)
310 {
311 struct vmbus_channel *channel = arg;
312
313 list_del(&channel->percpu_list);
314 }
315
316
317 static void vmbus_release_relid(u32 relid)
318 {
319 struct vmbus_channel_relid_released msg;
320
321 memset(&msg, 0, sizeof(struct vmbus_channel_relid_released));
322 msg.child_relid = relid;
323 msg.header.msgtype = CHANNELMSG_RELID_RELEASED;
324 vmbus_post_msg(&msg, sizeof(struct vmbus_channel_relid_released));
325 }
326
327 void hv_event_tasklet_disable(struct vmbus_channel *channel)
328 {
329 struct tasklet_struct *tasklet;
330 tasklet = hv_context.event_dpc[channel->target_cpu];
331 tasklet_disable(tasklet);
332 }
333
334 void hv_event_tasklet_enable(struct vmbus_channel *channel)
335 {
336 struct tasklet_struct *tasklet;
337 tasklet = hv_context.event_dpc[channel->target_cpu];
338 tasklet_enable(tasklet);
339
340 /* In case there is any pending event */
341 tasklet_schedule(tasklet);
342 }
343
344 void hv_process_channel_removal(struct vmbus_channel *channel, u32 relid)
345 {
346 unsigned long flags;
347 struct vmbus_channel *primary_channel;
348
349 BUG_ON(!channel->rescind);
350 BUG_ON(!mutex_is_locked(&vmbus_connection.channel_mutex));
351
352 hv_event_tasklet_disable(channel);
353 if (channel->target_cpu != get_cpu()) {
354 put_cpu();
355 smp_call_function_single(channel->target_cpu,
356 percpu_channel_deq, channel, true);
357 } else {
358 percpu_channel_deq(channel);
359 put_cpu();
360 }
361 hv_event_tasklet_enable(channel);
362
363 if (channel->primary_channel == NULL) {
364 list_del(&channel->listentry);
365
366 primary_channel = channel;
367 } else {
368 primary_channel = channel->primary_channel;
369 spin_lock_irqsave(&primary_channel->lock, flags);
370 list_del(&channel->sc_list);
371 primary_channel->num_sc--;
372 spin_unlock_irqrestore(&primary_channel->lock, flags);
373 }
374
375 /*
376 * We need to free the bit for init_vp_index() to work in the case
377 * of sub-channel, when we reload drivers like hv_netvsc.
378 */
379 if (channel->affinity_policy == HV_LOCALIZED)
380 cpumask_clear_cpu(channel->target_cpu,
381 &primary_channel->alloced_cpus_in_node);
382
383 vmbus_release_relid(relid);
384
385 free_channel(channel);
386 }
387
388 void vmbus_free_channels(void)
389 {
390 struct vmbus_channel *channel, *tmp;
391
392 mutex_lock(&vmbus_connection.channel_mutex);
393 list_for_each_entry_safe(channel, tmp, &vmbus_connection.chn_list,
394 listentry) {
395 /* hv_process_channel_removal() needs this */
396 channel->rescind = true;
397
398 vmbus_device_unregister(channel->device_obj);
399 }
400 mutex_unlock(&vmbus_connection.channel_mutex);
401 }
402
403 /*
404 * vmbus_process_offer - Process the offer by creating a channel/device
405 * associated with this offer
406 */
407 static void vmbus_process_offer(struct vmbus_channel *newchannel)
408 {
409 struct vmbus_channel *channel;
410 bool fnew = true;
411 unsigned long flags;
412 u16 dev_type;
413 int ret;
414
415 /* Make sure this is a new offer */
416 mutex_lock(&vmbus_connection.channel_mutex);
417
418 list_for_each_entry(channel, &vmbus_connection.chn_list, listentry) {
419 if (!uuid_le_cmp(channel->offermsg.offer.if_type,
420 newchannel->offermsg.offer.if_type) &&
421 !uuid_le_cmp(channel->offermsg.offer.if_instance,
422 newchannel->offermsg.offer.if_instance)) {
423 fnew = false;
424 break;
425 }
426 }
427
428 if (fnew)
429 list_add_tail(&newchannel->listentry,
430 &vmbus_connection.chn_list);
431
432 mutex_unlock(&vmbus_connection.channel_mutex);
433
434 if (!fnew) {
435 /*
436 * Check to see if this is a sub-channel.
437 */
438 if (newchannel->offermsg.offer.sub_channel_index != 0) {
439 /*
440 * Process the sub-channel.
441 */
442 newchannel->primary_channel = channel;
443 spin_lock_irqsave(&channel->lock, flags);
444 list_add_tail(&newchannel->sc_list, &channel->sc_list);
445 channel->num_sc++;
446 spin_unlock_irqrestore(&channel->lock, flags);
447 } else
448 goto err_free_chan;
449 }
450
451 dev_type = hv_get_dev_type(newchannel);
452
453 init_vp_index(newchannel, dev_type);
454
455 hv_event_tasklet_disable(newchannel);
456 if (newchannel->target_cpu != get_cpu()) {
457 put_cpu();
458 smp_call_function_single(newchannel->target_cpu,
459 percpu_channel_enq,
460 newchannel, true);
461 } else {
462 percpu_channel_enq(newchannel);
463 put_cpu();
464 }
465 hv_event_tasklet_enable(newchannel);
466
467 /*
468 * This state is used to indicate a successful open
469 * so that when we do close the channel normally, we
470 * can cleanup properly
471 */
472 newchannel->state = CHANNEL_OPEN_STATE;
473
474 if (!fnew) {
475 if (channel->sc_creation_callback != NULL)
476 channel->sc_creation_callback(newchannel);
477 return;
478 }
479
480 /*
481 * Start the process of binding this offer to the driver
482 * We need to set the DeviceObject field before calling
483 * vmbus_child_dev_add()
484 */
485 newchannel->device_obj = vmbus_device_create(
486 &newchannel->offermsg.offer.if_type,
487 &newchannel->offermsg.offer.if_instance,
488 newchannel);
489 if (!newchannel->device_obj)
490 goto err_deq_chan;
491
492 newchannel->device_obj->device_id = dev_type;
493 /*
494 * Add the new device to the bus. This will kick off device-driver
495 * binding which eventually invokes the device driver's AddDevice()
496 * method.
497 */
498 mutex_lock(&vmbus_connection.channel_mutex);
499 ret = vmbus_device_register(newchannel->device_obj);
500 mutex_unlock(&vmbus_connection.channel_mutex);
501
502 if (ret != 0) {
503 pr_err("unable to add child device object (relid %d)\n",
504 newchannel->offermsg.child_relid);
505 kfree(newchannel->device_obj);
506 goto err_deq_chan;
507 }
508 return;
509
510 err_deq_chan:
511 mutex_lock(&vmbus_connection.channel_mutex);
512 list_del(&newchannel->listentry);
513 mutex_unlock(&vmbus_connection.channel_mutex);
514
515 hv_event_tasklet_disable(newchannel);
516 if (newchannel->target_cpu != get_cpu()) {
517 put_cpu();
518 smp_call_function_single(newchannel->target_cpu,
519 percpu_channel_deq, newchannel, true);
520 } else {
521 percpu_channel_deq(newchannel);
522 put_cpu();
523 }
524 hv_event_tasklet_enable(newchannel);
525
526 vmbus_release_relid(newchannel->offermsg.child_relid);
527
528 err_free_chan:
529 free_channel(newchannel);
530 }
531
532 /*
533 * We use this state to statically distribute the channel interrupt load.
534 */
535 static int next_numa_node_id;
536
537 /*
538 * Starting with Win8, we can statically distribute the incoming
539 * channel interrupt load by binding a channel to VCPU.
540 * We do this in a hierarchical fashion:
541 * First distribute the primary channels across available NUMA nodes
542 * and then distribute the subchannels amongst the CPUs in the NUMA
543 * node assigned to the primary channel.
544 *
545 * For pre-win8 hosts or non-performance critical channels we assign the
546 * first CPU in the first NUMA node.
547 */
548 static void init_vp_index(struct vmbus_channel *channel, u16 dev_type)
549 {
550 u32 cur_cpu;
551 bool perf_chn = vmbus_devs[dev_type].perf_device;
552 struct vmbus_channel *primary = channel->primary_channel;
553 int next_node;
554 struct cpumask available_mask;
555 struct cpumask *alloced_mask;
556
557 if ((vmbus_proto_version == VERSION_WS2008) ||
558 (vmbus_proto_version == VERSION_WIN7) || (!perf_chn)) {
559 /*
560 * Prior to win8, all channel interrupts are
561 * delivered on cpu 0.
562 * Also if the channel is not a performance critical
563 * channel, bind it to cpu 0.
564 */
565 channel->numa_node = 0;
566 channel->target_cpu = 0;
567 channel->target_vp = hv_context.vp_index[0];
568 return;
569 }
570
571 /*
572 * Based on the channel affinity policy, we will assign the NUMA
573 * nodes.
574 */
575
576 if ((channel->affinity_policy == HV_BALANCED) || (!primary)) {
577 while (true) {
578 next_node = next_numa_node_id++;
579 if (next_node == nr_node_ids) {
580 next_node = next_numa_node_id = 0;
581 continue;
582 }
583 if (cpumask_empty(cpumask_of_node(next_node)))
584 continue;
585 break;
586 }
587 channel->numa_node = next_node;
588 primary = channel;
589 }
590 alloced_mask = &hv_context.hv_numa_map[primary->numa_node];
591
592 if (cpumask_weight(alloced_mask) ==
593 cpumask_weight(cpumask_of_node(primary->numa_node))) {
594 /*
595 * We have cycled through all the CPUs in the node;
596 * reset the alloced map.
597 */
598 cpumask_clear(alloced_mask);
599 }
600
601 cpumask_xor(&available_mask, alloced_mask,
602 cpumask_of_node(primary->numa_node));
603
604 cur_cpu = -1;
605
606 if (primary->affinity_policy == HV_LOCALIZED) {
607 /*
608 * Normally Hyper-V host doesn't create more subchannels
609 * than there are VCPUs on the node but it is possible when not
610 * all present VCPUs on the node are initialized by guest.
611 * Clear the alloced_cpus_in_node to start over.
612 */
613 if (cpumask_equal(&primary->alloced_cpus_in_node,
614 cpumask_of_node(primary->numa_node)))
615 cpumask_clear(&primary->alloced_cpus_in_node);
616 }
617
618 while (true) {
619 cur_cpu = cpumask_next(cur_cpu, &available_mask);
620 if (cur_cpu >= nr_cpu_ids) {
621 cur_cpu = -1;
622 cpumask_copy(&available_mask,
623 cpumask_of_node(primary->numa_node));
624 continue;
625 }
626
627 if (primary->affinity_policy == HV_LOCALIZED) {
628 /*
629 * NOTE: in the case of sub-channel, we clear the
630 * sub-channel related bit(s) in
631 * primary->alloced_cpus_in_node in
632 * hv_process_channel_removal(), so when we
633 * reload drivers like hv_netvsc in SMP guest, here
634 * we're able to re-allocate
635 * bit from primary->alloced_cpus_in_node.
636 */
637 if (!cpumask_test_cpu(cur_cpu,
638 &primary->alloced_cpus_in_node)) {
639 cpumask_set_cpu(cur_cpu,
640 &primary->alloced_cpus_in_node);
641 cpumask_set_cpu(cur_cpu, alloced_mask);
642 break;
643 }
644 } else {
645 cpumask_set_cpu(cur_cpu, alloced_mask);
646 break;
647 }
648 }
649
650 channel->target_cpu = cur_cpu;
651 channel->target_vp = hv_context.vp_index[cur_cpu];
652 }
653
654 static void vmbus_wait_for_unload(void)
655 {
656 int cpu;
657 void *page_addr;
658 struct hv_message *msg;
659 struct vmbus_channel_message_header *hdr;
660 u32 message_type;
661
662 /*
663 * CHANNELMSG_UNLOAD_RESPONSE is always delivered to the CPU which was
664 * used for initial contact or to CPU0 depending on host version. When
665 * we're crashing on a different CPU let's hope that IRQ handler on
666 * the cpu which receives CHANNELMSG_UNLOAD_RESPONSE is still
667 * functional and vmbus_unload_response() will complete
668 * vmbus_connection.unload_event. If not, the last thing we can do is
669 * read message pages for all CPUs directly.
670 */
671 while (1) {
672 if (completion_done(&vmbus_connection.unload_event))
673 break;
674
675 for_each_online_cpu(cpu) {
676 page_addr = hv_context.synic_message_page[cpu];
677 msg = (struct hv_message *)page_addr +
678 VMBUS_MESSAGE_SINT;
679
680 message_type = READ_ONCE(msg->header.message_type);
681 if (message_type == HVMSG_NONE)
682 continue;
683
684 hdr = (struct vmbus_channel_message_header *)
685 msg->u.payload;
686
687 if (hdr->msgtype == CHANNELMSG_UNLOAD_RESPONSE)
688 complete(&vmbus_connection.unload_event);
689
690 vmbus_signal_eom(msg, message_type);
691 }
692
693 mdelay(10);
694 }
695
696 /*
697 * We're crashing and already got the UNLOAD_RESPONSE, cleanup all
698 * maybe-pending messages on all CPUs to be able to receive new
699 * messages after we reconnect.
700 */
701 for_each_online_cpu(cpu) {
702 page_addr = hv_context.synic_message_page[cpu];
703 msg = (struct hv_message *)page_addr + VMBUS_MESSAGE_SINT;
704 msg->header.message_type = HVMSG_NONE;
705 }
706 }
707
708 /*
709 * vmbus_unload_response - Handler for the unload response.
710 */
711 static void vmbus_unload_response(struct vmbus_channel_message_header *hdr)
712 {
713 /*
714 * This is a global event; just wakeup the waiting thread.
715 * Once we successfully unload, we can cleanup the monitor state.
716 */
717 complete(&vmbus_connection.unload_event);
718 }
719
720 void vmbus_initiate_unload(bool crash)
721 {
722 struct vmbus_channel_message_header hdr;
723
724 /* Pre-Win2012R2 hosts don't support reconnect */
725 if (vmbus_proto_version < VERSION_WIN8_1)
726 return;
727
728 init_completion(&vmbus_connection.unload_event);
729 memset(&hdr, 0, sizeof(struct vmbus_channel_message_header));
730 hdr.msgtype = CHANNELMSG_UNLOAD;
731 vmbus_post_msg(&hdr, sizeof(struct vmbus_channel_message_header));
732
733 /*
734 * vmbus_initiate_unload() is also called on crash and the crash can be
735 * happening in an interrupt context, where scheduling is impossible.
736 */
737 if (!crash)
738 wait_for_completion(&vmbus_connection.unload_event);
739 else
740 vmbus_wait_for_unload();
741 }
742
743 /*
744 * vmbus_onoffer - Handler for channel offers from vmbus in parent partition.
745 *
746 */
747 static void vmbus_onoffer(struct vmbus_channel_message_header *hdr)
748 {
749 struct vmbus_channel_offer_channel *offer;
750 struct vmbus_channel *newchannel;
751
752 offer = (struct vmbus_channel_offer_channel *)hdr;
753
754 /* Allocate the channel object and save this offer. */
755 newchannel = alloc_channel();
756 if (!newchannel) {
757 pr_err("Unable to allocate channel object\n");
758 return;
759 }
760
761 /*
762 * By default we setup state to enable batched
763 * reading. A specific service can choose to
764 * disable this prior to opening the channel.
765 */
766 newchannel->batched_reading = true;
767
768 /*
769 * Setup state for signalling the host.
770 */
771 newchannel->sig_event = (struct hv_input_signal_event *)
772 (ALIGN((unsigned long)
773 &newchannel->sig_buf,
774 HV_HYPERCALL_PARAM_ALIGN));
775
776 newchannel->sig_event->connectionid.asu32 = 0;
777 newchannel->sig_event->connectionid.u.id = VMBUS_EVENT_CONNECTION_ID;
778 newchannel->sig_event->flag_number = 0;
779 newchannel->sig_event->rsvdz = 0;
780
781 if (vmbus_proto_version != VERSION_WS2008) {
782 newchannel->is_dedicated_interrupt =
783 (offer->is_dedicated_interrupt != 0);
784 newchannel->sig_event->connectionid.u.id =
785 offer->connection_id;
786 }
787
788 memcpy(&newchannel->offermsg, offer,
789 sizeof(struct vmbus_channel_offer_channel));
790 newchannel->monitor_grp = (u8)offer->monitorid / 32;
791 newchannel->monitor_bit = (u8)offer->monitorid % 32;
792
793 vmbus_process_offer(newchannel);
794 }
795
796 /*
797 * vmbus_onoffer_rescind - Rescind offer handler.
798 *
799 * We queue a work item to process this offer synchronously
800 */
801 static void vmbus_onoffer_rescind(struct vmbus_channel_message_header *hdr)
802 {
803 struct vmbus_channel_rescind_offer *rescind;
804 struct vmbus_channel *channel;
805 unsigned long flags;
806 struct device *dev;
807
808 rescind = (struct vmbus_channel_rescind_offer *)hdr;
809
810 mutex_lock(&vmbus_connection.channel_mutex);
811 channel = relid2channel(rescind->child_relid);
812
813 if (channel == NULL) {
814 /*
815 * This is very impossible, because in
816 * vmbus_process_offer(), we have already invoked
817 * vmbus_release_relid() on error.
818 */
819 goto out;
820 }
821
822 spin_lock_irqsave(&channel->lock, flags);
823 channel->rescind = true;
824 spin_unlock_irqrestore(&channel->lock, flags);
825
826 if (channel->device_obj) {
827 if (channel->chn_rescind_callback) {
828 channel->chn_rescind_callback(channel);
829 goto out;
830 }
831 /*
832 * We will have to unregister this device from the
833 * driver core.
834 */
835 dev = get_device(&channel->device_obj->device);
836 if (dev) {
837 vmbus_device_unregister(channel->device_obj);
838 put_device(dev);
839 }
840 } else {
841 hv_process_channel_removal(channel,
842 channel->offermsg.child_relid);
843 }
844
845 out:
846 mutex_unlock(&vmbus_connection.channel_mutex);
847 }
848
849 void vmbus_hvsock_device_unregister(struct vmbus_channel *channel)
850 {
851 mutex_lock(&vmbus_connection.channel_mutex);
852
853 BUG_ON(!is_hvsock_channel(channel));
854
855 channel->rescind = true;
856 vmbus_device_unregister(channel->device_obj);
857
858 mutex_unlock(&vmbus_connection.channel_mutex);
859 }
860 EXPORT_SYMBOL_GPL(vmbus_hvsock_device_unregister);
861
862
/*
 * vmbus_onoffers_delivered - Handler for CHANNELMSG_ALLOFFERS_DELIVERED.
 *
 * This is invoked when all offers have been delivered.  The message needs no
 * processing, so the handler is intentionally empty.
 */
static void vmbus_onoffers_delivered(struct vmbus_channel_message_header *hdr)
{
}
873
874 /*
875 * vmbus_onopen_result - Open result handler.
876 *
877 * This is invoked when we received a response to our channel open request.
878 * Find the matching request, copy the response and signal the requesting
879 * thread.
880 */
881 static void vmbus_onopen_result(struct vmbus_channel_message_header *hdr)
882 {
883 struct vmbus_channel_open_result *result;
884 struct vmbus_channel_msginfo *msginfo;
885 struct vmbus_channel_message_header *requestheader;
886 struct vmbus_channel_open_channel *openmsg;
887 unsigned long flags;
888
889 result = (struct vmbus_channel_open_result *)hdr;
890
891 /*
892 * Find the open msg, copy the result and signal/unblock the wait event
893 */
894 spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
895
896 list_for_each_entry(msginfo, &vmbus_connection.chn_msg_list,
897 msglistentry) {
898 requestheader =
899 (struct vmbus_channel_message_header *)msginfo->msg;
900
901 if (requestheader->msgtype == CHANNELMSG_OPENCHANNEL) {
902 openmsg =
903 (struct vmbus_channel_open_channel *)msginfo->msg;
904 if (openmsg->child_relid == result->child_relid &&
905 openmsg->openid == result->openid) {
906 memcpy(&msginfo->response.open_result,
907 result,
908 sizeof(
909 struct vmbus_channel_open_result));
910 complete(&msginfo->waitevent);
911 break;
912 }
913 }
914 }
915 spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
916 }
917
918 /*
919 * vmbus_ongpadl_created - GPADL created handler.
920 *
921 * This is invoked when we received a response to our gpadl create request.
922 * Find the matching request, copy the response and signal the requesting
923 * thread.
924 */
925 static void vmbus_ongpadl_created(struct vmbus_channel_message_header *hdr)
926 {
927 struct vmbus_channel_gpadl_created *gpadlcreated;
928 struct vmbus_channel_msginfo *msginfo;
929 struct vmbus_channel_message_header *requestheader;
930 struct vmbus_channel_gpadl_header *gpadlheader;
931 unsigned long flags;
932
933 gpadlcreated = (struct vmbus_channel_gpadl_created *)hdr;
934
935 /*
936 * Find the establish msg, copy the result and signal/unblock the wait
937 * event
938 */
939 spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
940
941 list_for_each_entry(msginfo, &vmbus_connection.chn_msg_list,
942 msglistentry) {
943 requestheader =
944 (struct vmbus_channel_message_header *)msginfo->msg;
945
946 if (requestheader->msgtype == CHANNELMSG_GPADL_HEADER) {
947 gpadlheader =
948 (struct vmbus_channel_gpadl_header *)requestheader;
949
950 if ((gpadlcreated->child_relid ==
951 gpadlheader->child_relid) &&
952 (gpadlcreated->gpadl == gpadlheader->gpadl)) {
953 memcpy(&msginfo->response.gpadl_created,
954 gpadlcreated,
955 sizeof(
956 struct vmbus_channel_gpadl_created));
957 complete(&msginfo->waitevent);
958 break;
959 }
960 }
961 }
962 spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
963 }
964
965 /*
966 * vmbus_ongpadl_torndown - GPADL torndown handler.
967 *
968 * This is invoked when we received a response to our gpadl teardown request.
969 * Find the matching request, copy the response and signal the requesting
970 * thread.
971 */
972 static void vmbus_ongpadl_torndown(
973 struct vmbus_channel_message_header *hdr)
974 {
975 struct vmbus_channel_gpadl_torndown *gpadl_torndown;
976 struct vmbus_channel_msginfo *msginfo;
977 struct vmbus_channel_message_header *requestheader;
978 struct vmbus_channel_gpadl_teardown *gpadl_teardown;
979 unsigned long flags;
980
981 gpadl_torndown = (struct vmbus_channel_gpadl_torndown *)hdr;
982
983 /*
984 * Find the open msg, copy the result and signal/unblock the wait event
985 */
986 spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
987
988 list_for_each_entry(msginfo, &vmbus_connection.chn_msg_list,
989 msglistentry) {
990 requestheader =
991 (struct vmbus_channel_message_header *)msginfo->msg;
992
993 if (requestheader->msgtype == CHANNELMSG_GPADL_TEARDOWN) {
994 gpadl_teardown =
995 (struct vmbus_channel_gpadl_teardown *)requestheader;
996
997 if (gpadl_torndown->gpadl == gpadl_teardown->gpadl) {
998 memcpy(&msginfo->response.gpadl_torndown,
999 gpadl_torndown,
1000 sizeof(
1001 struct vmbus_channel_gpadl_torndown));
1002 complete(&msginfo->waitevent);
1003 break;
1004 }
1005 }
1006 }
1007 spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
1008 }
1009
1010 /*
1011 * vmbus_onversion_response - Version response handler
1012 *
1013 * This is invoked when we received a response to our initiate contact request.
1014 * Find the matching request, copy the response and signal the requesting
1015 * thread.
1016 */
1017 static void vmbus_onversion_response(
1018 struct vmbus_channel_message_header *hdr)
1019 {
1020 struct vmbus_channel_msginfo *msginfo;
1021 struct vmbus_channel_message_header *requestheader;
1022 struct vmbus_channel_version_response *version_response;
1023 unsigned long flags;
1024
1025 version_response = (struct vmbus_channel_version_response *)hdr;
1026 spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
1027
1028 list_for_each_entry(msginfo, &vmbus_connection.chn_msg_list,
1029 msglistentry) {
1030 requestheader =
1031 (struct vmbus_channel_message_header *)msginfo->msg;
1032
1033 if (requestheader->msgtype ==
1034 CHANNELMSG_INITIATE_CONTACT) {
1035 memcpy(&msginfo->response.version_response,
1036 version_response,
1037 sizeof(struct vmbus_channel_version_response));
1038 complete(&msginfo->waitevent);
1039 }
1040 }
1041 spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
1042 }
1043
1044 /* Channel message dispatch table */
1045 struct vmbus_channel_message_table_entry
1046 channel_message_table[CHANNELMSG_COUNT] = {
1047 {CHANNELMSG_INVALID, 0, NULL},
1048 {CHANNELMSG_OFFERCHANNEL, 0, vmbus_onoffer},
1049 {CHANNELMSG_RESCIND_CHANNELOFFER, 0, vmbus_onoffer_rescind},
1050 {CHANNELMSG_REQUESTOFFERS, 0, NULL},
1051 {CHANNELMSG_ALLOFFERS_DELIVERED, 1, vmbus_onoffers_delivered},
1052 {CHANNELMSG_OPENCHANNEL, 0, NULL},
1053 {CHANNELMSG_OPENCHANNEL_RESULT, 1, vmbus_onopen_result},
1054 {CHANNELMSG_CLOSECHANNEL, 0, NULL},
1055 {CHANNELMSG_GPADL_HEADER, 0, NULL},
1056 {CHANNELMSG_GPADL_BODY, 0, NULL},
1057 {CHANNELMSG_GPADL_CREATED, 1, vmbus_ongpadl_created},
1058 {CHANNELMSG_GPADL_TEARDOWN, 0, NULL},
1059 {CHANNELMSG_GPADL_TORNDOWN, 1, vmbus_ongpadl_torndown},
1060 {CHANNELMSG_RELID_RELEASED, 0, NULL},
1061 {CHANNELMSG_INITIATE_CONTACT, 0, NULL},
1062 {CHANNELMSG_VERSION_RESPONSE, 1, vmbus_onversion_response},
1063 {CHANNELMSG_UNLOAD, 0, NULL},
1064 {CHANNELMSG_UNLOAD_RESPONSE, 1, vmbus_unload_response},
1065 {CHANNELMSG_18, 0, NULL},
1066 {CHANNELMSG_19, 0, NULL},
1067 {CHANNELMSG_20, 0, NULL},
1068 {CHANNELMSG_TL_CONNECT_REQUEST, 0, NULL},
1069 };
1070
1071 /*
1072 * vmbus_onmessage - Handler for channel protocol messages.
1073 *
1074 * This is invoked in the vmbus worker thread context.
1075 */
1076 void vmbus_onmessage(void *context)
1077 {
1078 struct hv_message *msg = context;
1079 struct vmbus_channel_message_header *hdr;
1080 int size;
1081
1082 hdr = (struct vmbus_channel_message_header *)msg->u.payload;
1083 size = msg->header.payload_size;
1084
1085 if (hdr->msgtype >= CHANNELMSG_COUNT) {
1086 pr_err("Received invalid channel message type %d size %d\n",
1087 hdr->msgtype, size);
1088 print_hex_dump_bytes("", DUMP_PREFIX_NONE,
1089 (unsigned char *)msg->u.payload, size);
1090 return;
1091 }
1092
1093 if (channel_message_table[hdr->msgtype].message_handler)
1094 channel_message_table[hdr->msgtype].message_handler(hdr);
1095 else
1096 pr_err("Unhandled channel message type %d\n", hdr->msgtype);
1097 }
1098
1099 /*
1100 * vmbus_request_offers - Send a request to get all our pending offers.
1101 */
1102 int vmbus_request_offers(void)
1103 {
1104 struct vmbus_channel_message_header *msg;
1105 struct vmbus_channel_msginfo *msginfo;
1106 int ret;
1107
1108 msginfo = kmalloc(sizeof(*msginfo) +
1109 sizeof(struct vmbus_channel_message_header),
1110 GFP_KERNEL);
1111 if (!msginfo)
1112 return -ENOMEM;
1113
1114 msg = (struct vmbus_channel_message_header *)msginfo->msg;
1115
1116 msg->msgtype = CHANNELMSG_REQUESTOFFERS;
1117
1118
1119 ret = vmbus_post_msg(msg,
1120 sizeof(struct vmbus_channel_message_header));
1121 if (ret != 0) {
1122 pr_err("Unable to request offers - %d\n", ret);
1123
1124 goto cleanup;
1125 }
1126
1127 cleanup:
1128 kfree(msginfo);
1129
1130 return ret;
1131 }
1132
1133 /*
1134 * Retrieve the (sub) channel on which to send an outgoing request.
1135 * When a primary channel has multiple sub-channels, we try to
1136 * distribute the load equally amongst all available channels.
1137 */
1138 struct vmbus_channel *vmbus_get_outgoing_channel(struct vmbus_channel *primary)
1139 {
1140 struct list_head *cur, *tmp;
1141 int cur_cpu;
1142 struct vmbus_channel *cur_channel;
1143 struct vmbus_channel *outgoing_channel = primary;
1144 int next_channel;
1145 int i = 1;
1146
1147 if (list_empty(&primary->sc_list))
1148 return outgoing_channel;
1149
1150 next_channel = primary->next_oc++;
1151
1152 if (next_channel > (primary->num_sc)) {
1153 primary->next_oc = 0;
1154 return outgoing_channel;
1155 }
1156
1157 cur_cpu = hv_context.vp_index[get_cpu()];
1158 put_cpu();
1159 list_for_each_safe(cur, tmp, &primary->sc_list) {
1160 cur_channel = list_entry(cur, struct vmbus_channel, sc_list);
1161 if (cur_channel->state != CHANNEL_OPENED_STATE)
1162 continue;
1163
1164 if (cur_channel->target_vp == cur_cpu)
1165 return cur_channel;
1166
1167 if (i == next_channel)
1168 return cur_channel;
1169
1170 i++;
1171 }
1172
1173 return outgoing_channel;
1174 }
1175 EXPORT_SYMBOL_GPL(vmbus_get_outgoing_channel);
1176
1177 static void invoke_sc_cb(struct vmbus_channel *primary_channel)
1178 {
1179 struct list_head *cur, *tmp;
1180 struct vmbus_channel *cur_channel;
1181
1182 if (primary_channel->sc_creation_callback == NULL)
1183 return;
1184
1185 list_for_each_safe(cur, tmp, &primary_channel->sc_list) {
1186 cur_channel = list_entry(cur, struct vmbus_channel, sc_list);
1187
1188 primary_channel->sc_creation_callback(cur_channel);
1189 }
1190 }
1191
1192 void vmbus_set_sc_create_callback(struct vmbus_channel *primary_channel,
1193 void (*sc_cr_cb)(struct vmbus_channel *new_sc))
1194 {
1195 primary_channel->sc_creation_callback = sc_cr_cb;
1196 }
1197 EXPORT_SYMBOL_GPL(vmbus_set_sc_create_callback);
1198
1199 bool vmbus_are_subchannels_present(struct vmbus_channel *primary)
1200 {
1201 bool ret;
1202
1203 ret = !list_empty(&primary->sc_list);
1204
1205 if (ret) {
1206 /*
1207 * Invoke the callback on sub-channel creation.
1208 * This will present a uniform interface to the
1209 * clients.
1210 */
1211 invoke_sc_cb(primary);
1212 }
1213
1214 return ret;
1215 }
1216 EXPORT_SYMBOL_GPL(vmbus_are_subchannels_present);
1217
1218 void vmbus_set_chn_rescind_callback(struct vmbus_channel *channel,
1219 void (*chn_rescind_cb)(struct vmbus_channel *))
1220 {
1221 channel->chn_rescind_callback = chn_rescind_cb;
1222 }
1223 EXPORT_SYMBOL_GPL(vmbus_set_chn_rescind_callback);