vmbus_drv.c 24.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
/*
 * Copyright (c) 2009, Microsoft Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
 * Place - Suite 330, Boston, MA 02111-1307 USA.
 *
 * Authors:
 *   Haiyang Zhang <haiyangz@microsoft.com>
 *   Hank Janssen  <hjanssen@microsoft.com>
20
 *   K. Y. Srinivasan <kys@microsoft.com>
21
 *
22
 */
23 24
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

25 26 27 28 29
#include <linux/init.h>
#include <linux/module.h>
#include <linux/device.h>
#include <linux/interrupt.h>
#include <linux/sysctl.h>
30
#include <linux/slab.h>
31
#include <linux/acpi.h>
32
#include <linux/completion.h>
33
#include <linux/hyperv.h>
34
#include <linux/kernel_stat.h>
35
#include <asm/hyperv.h>
36
#include <asm/hypervisor.h>
37
#include <asm/mshyperv.h>
38
#include "hyperv_vmbus.h"
39

40
static struct acpi_device  *hv_acpi_dev;
41

42
static struct tasklet_struct msg_dpc;
43
static struct completion probe_event;
44
static int irq;
45

46 47 48 49 50 51 52 53
static int vmbus_exists(void)
{
	if (hv_acpi_dev == NULL)
		return -ENODEV;

	return 0;
}

54 55 56 57 58 59 60 61
#define VMBUS_ALIAS_LEN ((sizeof((struct hv_vmbus_device_id *)0)->guid) * 2)
static void print_alias_name(struct hv_device *hv_dev, char *alias_name)
{
	int i;
	for (i = 0; i < VMBUS_ALIAS_LEN; i += 2)
		sprintf(&alias_name[i], "%02x", hv_dev->dev_type.b[i/2]);
}

62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78
static u8 channel_monitor_group(struct vmbus_channel *channel)
{
	return (u8)channel->offermsg.monitorid / 32;
}

static u8 channel_monitor_offset(struct vmbus_channel *channel)
{
	return (u8)channel->offermsg.monitorid % 32;
}

static u32 channel_pending(struct vmbus_channel *channel,
			   struct hv_monitor_page *monitor_page)
{
	u8 monitor_group = channel_monitor_group(channel);
	return monitor_page->trigger_group[monitor_group].pending;
}

79 80 81 82 83 84 85 86
static u32 channel_latency(struct vmbus_channel *channel,
			   struct hv_monitor_page *monitor_page)
{
	u8 monitor_group = channel_monitor_group(channel);
	u8 monitor_offset = channel_monitor_offset(channel);
	return monitor_page->latency[monitor_group][monitor_offset];
}

87 88 89 90 91 92 93 94
static u32 channel_conn_id(struct vmbus_channel *channel,
			   struct hv_monitor_page *monitor_page)
{
	u8 monitor_group = channel_monitor_group(channel);
	u8 monitor_offset = channel_monitor_offset(channel);
	return monitor_page->parameter[monitor_group][monitor_offset].connectionid.u.id;
}

95 96 97 98 99 100 101 102 103 104 105
static ssize_t id_show(struct device *dev, struct device_attribute *dev_attr,
		       char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n", hv_dev->channel->offermsg.child_relid);
}
static DEVICE_ATTR_RO(id);

106 107 108 109 110 111 112 113 114 115 116
static ssize_t state_show(struct device *dev, struct device_attribute *dev_attr,
			  char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n", hv_dev->channel->state);
}
static DEVICE_ATTR_RO(state);

117 118 119 120 121 122 123 124 125 126 127
static ssize_t monitor_id_show(struct device *dev,
			       struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n", hv_dev->channel->offermsg.monitorid);
}
static DEVICE_ATTR_RO(monitor_id);

128 129 130 131 132 133 134 135 136 137 138 139
static ssize_t class_id_show(struct device *dev,
			       struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "{%pUl}\n",
		       hv_dev->channel->offermsg.offer.if_type.b);
}
static DEVICE_ATTR_RO(class_id);

140 141 142 143 144 145 146 147 148 149 150 151
static ssize_t device_id_show(struct device *dev,
			      struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "{%pUl}\n",
		       hv_dev->channel->offermsg.offer.if_instance.b);
}
static DEVICE_ATTR_RO(device_id);

152 153 154 155 156 157 158 159 160 161 162
static ssize_t modalias_show(struct device *dev,
			     struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	char alias_name[VMBUS_ALIAS_LEN + 1];

	print_alias_name(hv_dev, alias_name);
	return sprintf(buf, "vmbus:%s\n", alias_name);
}
static DEVICE_ATTR_RO(modalias);

163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189
static ssize_t server_monitor_pending_show(struct device *dev,
					   struct device_attribute *dev_attr,
					   char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n",
		       channel_pending(hv_dev->channel,
				       vmbus_connection.monitor_pages[1]));
}
static DEVICE_ATTR_RO(server_monitor_pending);

static ssize_t client_monitor_pending_show(struct device *dev,
					   struct device_attribute *dev_attr,
					   char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n",
		       channel_pending(hv_dev->channel,
				       vmbus_connection.monitor_pages[1]));
}
static DEVICE_ATTR_RO(client_monitor_pending);
190

191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218
static ssize_t server_monitor_latency_show(struct device *dev,
					   struct device_attribute *dev_attr,
					   char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n",
		       channel_latency(hv_dev->channel,
				       vmbus_connection.monitor_pages[0]));
}
static DEVICE_ATTR_RO(server_monitor_latency);

static ssize_t client_monitor_latency_show(struct device *dev,
					   struct device_attribute *dev_attr,
					   char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n",
		       channel_latency(hv_dev->channel,
				       vmbus_connection.monitor_pages[1]));
}
static DEVICE_ATTR_RO(client_monitor_latency);

219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246
static ssize_t server_monitor_conn_id_show(struct device *dev,
					   struct device_attribute *dev_attr,
					   char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n",
		       channel_conn_id(hv_dev->channel,
				       vmbus_connection.monitor_pages[0]));
}
static DEVICE_ATTR_RO(server_monitor_conn_id);

static ssize_t client_monitor_conn_id_show(struct device *dev,
					   struct device_attribute *dev_attr,
					   char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);

	if (!hv_dev->channel)
		return -ENODEV;
	return sprintf(buf, "%d\n",
		       channel_conn_id(hv_dev->channel,
				       vmbus_connection.monitor_pages[1]));
}
static DEVICE_ATTR_RO(client_monitor_conn_id);

247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382
static ssize_t out_intr_mask_show(struct device *dev,
				  struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info outbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->outbound, &outbound);
	return sprintf(buf, "%d\n", outbound.current_interrupt_mask);
}
static DEVICE_ATTR_RO(out_intr_mask);

static ssize_t out_read_index_show(struct device *dev,
				   struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info outbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->outbound, &outbound);
	return sprintf(buf, "%d\n", outbound.current_read_index);
}
static DEVICE_ATTR_RO(out_read_index);

static ssize_t out_write_index_show(struct device *dev,
				    struct device_attribute *dev_attr,
				    char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info outbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->outbound, &outbound);
	return sprintf(buf, "%d\n", outbound.current_write_index);
}
static DEVICE_ATTR_RO(out_write_index);

static ssize_t out_read_bytes_avail_show(struct device *dev,
					 struct device_attribute *dev_attr,
					 char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info outbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->outbound, &outbound);
	return sprintf(buf, "%d\n", outbound.bytes_avail_toread);
}
static DEVICE_ATTR_RO(out_read_bytes_avail);

static ssize_t out_write_bytes_avail_show(struct device *dev,
					  struct device_attribute *dev_attr,
					  char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info outbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->outbound, &outbound);
	return sprintf(buf, "%d\n", outbound.bytes_avail_towrite);
}
static DEVICE_ATTR_RO(out_write_bytes_avail);

static ssize_t in_intr_mask_show(struct device *dev,
				 struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info inbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->inbound, &inbound);
	return sprintf(buf, "%d\n", inbound.current_interrupt_mask);
}
static DEVICE_ATTR_RO(in_intr_mask);

static ssize_t in_read_index_show(struct device *dev,
				  struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info inbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->inbound, &inbound);
	return sprintf(buf, "%d\n", inbound.current_read_index);
}
static DEVICE_ATTR_RO(in_read_index);

static ssize_t in_write_index_show(struct device *dev,
				   struct device_attribute *dev_attr, char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info inbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->inbound, &inbound);
	return sprintf(buf, "%d\n", inbound.current_write_index);
}
static DEVICE_ATTR_RO(in_write_index);

static ssize_t in_read_bytes_avail_show(struct device *dev,
					struct device_attribute *dev_attr,
					char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info inbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->inbound, &inbound);
	return sprintf(buf, "%d\n", inbound.bytes_avail_toread);
}
static DEVICE_ATTR_RO(in_read_bytes_avail);

static ssize_t in_write_bytes_avail_show(struct device *dev,
					 struct device_attribute *dev_attr,
					 char *buf)
{
	struct hv_device *hv_dev = device_to_hv_device(dev);
	struct hv_ring_buffer_debug_info inbound;

	if (!hv_dev->channel)
		return -ENODEV;
	hv_ringbuffer_get_debuginfo(&hv_dev->channel->inbound, &inbound);
	return sprintf(buf, "%d\n", inbound.bytes_avail_towrite);
}
static DEVICE_ATTR_RO(in_write_bytes_avail);

/* Set up per device attributes in /sys/bus/vmbus/devices/<bus device> */
383 384
static struct attribute *vmbus_attrs[] = {
	&dev_attr_id.attr,
385
	&dev_attr_state.attr,
386
	&dev_attr_monitor_id.attr,
387
	&dev_attr_class_id.attr,
388
	&dev_attr_device_id.attr,
389
	&dev_attr_modalias.attr,
390 391
	&dev_attr_server_monitor_pending.attr,
	&dev_attr_client_monitor_pending.attr,
392 393
	&dev_attr_server_monitor_latency.attr,
	&dev_attr_client_monitor_latency.attr,
394 395
	&dev_attr_server_monitor_conn_id.attr,
	&dev_attr_client_monitor_conn_id.attr,
396 397 398 399 400 401 402 403 404 405
	&dev_attr_out_intr_mask.attr,
	&dev_attr_out_read_index.attr,
	&dev_attr_out_write_index.attr,
	&dev_attr_out_read_bytes_avail.attr,
	&dev_attr_out_write_bytes_avail.attr,
	&dev_attr_in_intr_mask.attr,
	&dev_attr_in_read_index.attr,
	&dev_attr_in_write_index.attr,
	&dev_attr_in_read_bytes_avail.attr,
	&dev_attr_in_write_bytes_avail.attr,
406 407 408 409
	NULL,
};
ATTRIBUTE_GROUPS(vmbus);

410 411 412 413 414 415
/*
 * vmbus_uevent - add uevent for our device
 *
 * This routine is invoked when a device is added or removed on the vmbus to
 * generate a uevent to udev in the userspace. The udev will then look at its
 * rule and the uevent generated here to load the appropriate driver
416 417 418 419
 *
 * The alias string will be of the form vmbus:guid where guid is the string
 * representation of the device guid (each byte of the guid will be
 * represented with two hex characters.
420 421 422 423
 */
static int vmbus_uevent(struct device *device, struct kobj_uevent_env *env)
{
	struct hv_device *dev = device_to_hv_device(device);
424 425
	int ret;
	char alias_name[VMBUS_ALIAS_LEN + 1];
426

427
	print_alias_name(dev, alias_name);
428 429
	ret = add_uevent_var(env, "MODALIAS=vmbus:%s", alias_name);
	return ret;
430 431
}

432 433 434 435 436 437 438 439 440
static uuid_le null_guid;

static inline bool is_null_guid(const __u8 *guid)
{
	if (memcmp(guid, &null_guid, sizeof(uuid_le)))
		return false;
	return true;
}

441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456
/*
 * Return a matching hv_vmbus_device_id pointer.
 * If there is no match, return NULL.
 */
static const struct hv_vmbus_device_id *hv_vmbus_get_id(
					const struct hv_vmbus_device_id *id,
					__u8 *guid)
{
	for (; !is_null_guid(id->guid); id++)
		if (!memcmp(&id->guid, guid, sizeof(uuid_le)))
			return id;

	return NULL;
}


457 458 459 460 461 462 463

/*
 * vmbus_match - Attempt to match the specified device to the specified driver
 */
static int vmbus_match(struct device *device, struct device_driver *driver)
{
	struct hv_driver *drv = drv_to_hv_drv(driver);
464
	struct hv_device *hv_dev = device_to_hv_device(device);
465

466 467
	if (hv_vmbus_get_id(drv->id_table, hv_dev->dev_type.b))
		return 1;
468

469
	return 0;
470 471
}

472 473 474 475 476 477 478 479
/*
 * vmbus_probe - Add the new vmbus's child device
 */
static int vmbus_probe(struct device *child_device)
{
	int ret = 0;
	struct hv_driver *drv =
			drv_to_hv_drv(child_device->driver);
480
	struct hv_device *dev = device_to_hv_device(child_device);
481
	const struct hv_vmbus_device_id *dev_id;
482

483
	dev_id = hv_vmbus_get_id(drv->id_table, dev->dev_type.b);
484
	if (drv->probe) {
485
		ret = drv->probe(dev, dev_id);
486
		if (ret != 0)
487 488
			pr_err("probe failed for device %s (%d)\n",
			       dev_name(child_device), ret);
489 490

	} else {
491 492
		pr_err("probe not set for driver %s\n",
		       dev_name(child_device));
493
		ret = -ENODEV;
494 495 496 497
	}
	return ret;
}

498 499 500 501 502
/*
 * vmbus_remove - Remove a vmbus device
 */
static int vmbus_remove(struct device *child_device)
{
503
	struct hv_driver *drv = drv_to_hv_drv(child_device->driver);
504
	struct hv_device *dev = device_to_hv_device(child_device);
505

506 507 508 509 510
	if (drv->remove)
		drv->remove(dev);
	else
		pr_err("remove not set for driver %s\n",
			dev_name(child_device));
511 512 513 514

	return 0;
}

515 516 517 518 519 520 521

/*
 * vmbus_shutdown - Shutdown a vmbus device
 */
static void vmbus_shutdown(struct device *child_device)
{
	struct hv_driver *drv;
522
	struct hv_device *dev = device_to_hv_device(child_device);
523 524 525 526 527 528 529 530


	/* The device may not be attached yet */
	if (!child_device->driver)
		return;

	drv = drv_to_hv_drv(child_device->driver);

531 532
	if (drv->shutdown)
		drv->shutdown(dev);
533 534 535 536

	return;
}

537 538 539 540 541 542

/*
 * vmbus_device_release - Final callback release of the vmbus child device
 */
static void vmbus_device_release(struct device *device)
{
543
	struct hv_device *hv_dev = device_to_hv_device(device);
544

545
	kfree(hv_dev);
546 547 548

}

549
/* The one and only one */
550 551 552 553 554 555 556
static struct bus_type  hv_bus = {
	.name =		"vmbus",
	.match =		vmbus_match,
	.shutdown =		vmbus_shutdown,
	.remove =		vmbus_remove,
	.probe =		vmbus_probe,
	.uevent =		vmbus_uevent,
557
	.dev_groups =		vmbus_groups,
558 559
};

560 561 562 563 564 565 566 567 568 569 570 571 572 573 574
struct onmessage_work_context {
	struct work_struct work;
	struct hv_message msg;
};

static void vmbus_onmessage_work(struct work_struct *work)
{
	struct onmessage_work_context *ctx;

	ctx = container_of(work, struct onmessage_work_context,
			   work);
	vmbus_onmessage(&ctx->msg);
	kfree(ctx);
}

575
static void vmbus_on_msg_dpc(unsigned long data)
G
Greg Kroah-Hartman 已提交
576 577 578 579 580
{
	int cpu = smp_processor_id();
	void *page_addr = hv_context.synic_message_page[cpu];
	struct hv_message *msg = (struct hv_message *)page_addr +
				  VMBUS_MESSAGE_SINT;
581
	struct onmessage_work_context *ctx;
G
Greg Kroah-Hartman 已提交
582 583 584 585 586 587

	while (1) {
		if (msg->header.message_type == HVMSG_NONE) {
			/* no msg */
			break;
		} else {
588 589
			ctx = kmalloc(sizeof(*ctx), GFP_ATOMIC);
			if (ctx == NULL)
G
Greg Kroah-Hartman 已提交
590
				continue;
591 592
			INIT_WORK(&ctx->work, vmbus_onmessage_work);
			memcpy(&ctx->msg, msg, sizeof(*msg));
593
			queue_work(vmbus_connection.work_queue, &ctx->work);
G
Greg Kroah-Hartman 已提交
594 595 596 597 598 599 600 601 602 603 604
		}

		msg->header.message_type = HVMSG_NONE;

		/*
		 * Make sure the write to MessageType (ie set to
		 * HVMSG_NONE) happens before we read the
		 * MessagePending and EOMing. Otherwise, the EOMing
		 * will not deliver any more messages since there is
		 * no empty slot
		 */
605
		mb();
G
Greg Kroah-Hartman 已提交
606 607 608 609 610 611 612 613 614 615 616 617

		if (msg->header.message_flags.msg_pending) {
			/*
			 * This will cause message queue rescan to
			 * possibly deliver another msg from the
			 * hypervisor
			 */
			wrmsrl(HV_X64_MSR_EOM, 0);
		}
	}
}

618
static irqreturn_t vmbus_isr(int irq, void *dev_id)
G
Greg Kroah-Hartman 已提交
619 620 621 622 623
{
	int cpu = smp_processor_id();
	void *page_addr;
	struct hv_message *msg;
	union hv_synic_event_flags *event;
624
	bool handled = false;
G
Greg Kroah-Hartman 已提交
625

626 627 628 629 630 631
	page_addr = hv_context.synic_event_page[cpu];
	if (page_addr == NULL)
		return IRQ_NONE;

	event = (union hv_synic_event_flags *)page_addr +
					 VMBUS_MESSAGE_SINT;
632 633 634 635 636
	/*
	 * Check for events before checking for messages. This is the order
	 * in which events and messages are checked in Windows guests on
	 * Hyper-V, and the Windows team suggested we do the same.
	 */
G
Greg Kroah-Hartman 已提交
637

638 639
	if ((vmbus_proto_version == VERSION_WS2008) ||
		(vmbus_proto_version == VERSION_WIN7)) {
G
Greg Kroah-Hartman 已提交
640

641 642 643 644 645 646 647 648 649 650 651 652
		/* Since we are a child, we only need to check bit 0 */
		if (sync_test_and_clear_bit(0,
			(unsigned long *) &event->flags32[0])) {
			handled = true;
		}
	} else {
		/*
		 * Our host is win8 or above. The signaling mechanism
		 * has changed and we can directly look at the event page.
		 * If bit n is set then we have an interrup on the channel
		 * whose id is n.
		 */
653 654
		handled = true;
	}
655

656
	if (handled)
657
		tasklet_schedule(hv_context.event_dpc[cpu]);
658 659


660 661 662 663 664 665 666 667 668
	page_addr = hv_context.synic_message_page[cpu];
	msg = (struct hv_message *)page_addr + VMBUS_MESSAGE_SINT;

	/* Check if there are actual msgs to be processed */
	if (msg->header.message_type != HVMSG_NONE) {
		handled = true;
		tasklet_schedule(&msg_dpc);
	}

669
	if (handled)
670
		return IRQ_HANDLED;
671
	else
672 673 674
		return IRQ_NONE;
}

675
/*
676 677 678
 * vmbus_bus_init -Main vmbus driver initialization routine.
 *
 * Here, we
679 680 681 682
 *	- initialize the vmbus driver context
 *	- invoke the vmbus hv main init routine
 *	- get the irq resource
 *	- retrieve the channel offers
683
 */
684
static int vmbus_bus_init(int irq)
685
{
686
	int ret;
687

688 689
	/* Hypervisor initialization...setup hypercall page..etc */
	ret = hv_init();
690
	if (ret != 0) {
691
		pr_err("Unable to initialize the hypervisor - 0x%x\n", ret);
692
		return ret;
693 694
	}

695
	tasklet_init(&msg_dpc, vmbus_on_msg_dpc, 0);
696

697
	ret = bus_register(&hv_bus);
698
	if (ret)
699
		goto err_cleanup;
700

701
	ret = hv_setup_vmbus_irq(irq, vmbus_isr, hv_acpi_dev);
702

703
	if (ret != 0) {
704
		pr_err("Unable to request IRQ %d\n", irq);
705
		goto err_unregister;
706 707
	}

708 709 710
	ret = hv_synic_alloc();
	if (ret)
		goto err_alloc;
711
	/*
712
	 * Initialize the per-cpu interrupt state and
713 714
	 * connect to the host.
	 */
715
	on_each_cpu(hv_synic_init, NULL, 1);
716
	ret = vmbus_connect();
717
	if (ret)
718
		goto err_alloc;
719

720
	vmbus_request_offers();
721

722
	return 0;
723

724 725
err_alloc:
	hv_synic_free();
726
	hv_remove_vmbus_irq(irq, hv_acpi_dev);
727 728 729 730 731 732 733 734

err_unregister:
	bus_unregister(&hv_bus);

err_cleanup:
	hv_cleanup();

	return ret;
735 736
}

737
/**
738 739 740 741
 * __vmbus_child_driver_register - Register a vmbus's driver
 * @drv: Pointer to driver structure you want to register
 * @owner: owner module of the drv
 * @mod_name: module name string
742 743
 *
 * Registers the given driver with Linux through the 'driver_register()' call
744
 * and sets up the hyper-v vmbus handling for this driver.
745 746
 * It will return the state of the 'driver_register()' call.
 *
747
 */
748
int __vmbus_driver_register(struct hv_driver *hv_driver, struct module *owner, const char *mod_name)
749
{
750
	int ret;
751

752
	pr_info("registering driver %s\n", hv_driver->name);
753

754 755 756 757
	ret = vmbus_exists();
	if (ret < 0)
		return ret;

758 759 760 761
	hv_driver->driver.name = hv_driver->name;
	hv_driver->driver.owner = owner;
	hv_driver->driver.mod_name = mod_name;
	hv_driver->driver.bus = &hv_bus;
762

763
	ret = driver_register(&hv_driver->driver);
764

765
	return ret;
766
}
767
EXPORT_SYMBOL_GPL(__vmbus_driver_register);
768

769
/**
770 771
 * vmbus_driver_unregister() - Unregister a vmbus's driver
 * @drv: Pointer to driver structure you want to un-register
772
 *
773 774
 * Un-register the given driver that was previous registered with a call to
 * vmbus_driver_register()
775
 */
776
void vmbus_driver_unregister(struct hv_driver *hv_driver)
777
{
778
	pr_info("unregistering driver %s\n", hv_driver->name);
779

780
	if (!vmbus_exists())
781
		driver_unregister(&hv_driver->driver);
782
}
783
EXPORT_SYMBOL_GPL(vmbus_driver_unregister);
784

785
/*
786
 * vmbus_device_create - Creates and registers a new child device
787
 * on the vmbus.
788
 */
789
struct hv_device *vmbus_device_create(uuid_le *type,
790
					    uuid_le *instance,
791
					    struct vmbus_channel *channel)
792
{
793
	struct hv_device *child_device_obj;
794

795 796
	child_device_obj = kzalloc(sizeof(struct hv_device), GFP_KERNEL);
	if (!child_device_obj) {
797
		pr_err("Unable to allocate device object for child device\n");
798 799 800
		return NULL;
	}

801
	child_device_obj->channel = channel;
802
	memcpy(&child_device_obj->dev_type, type, sizeof(uuid_le));
803
	memcpy(&child_device_obj->dev_instance, instance,
804
	       sizeof(uuid_le));
805 806 807 808 809


	return child_device_obj;
}

810
/*
811
 * vmbus_device_register - Register the child device
812
 */
813
int vmbus_device_register(struct hv_device *child_device_obj)
814
{
815
	int ret = 0;
816

817
	static atomic_t device_num = ATOMIC_INIT(0);
818

819
	dev_set_name(&child_device_obj->device, "vmbus_0_%d",
820
		     atomic_inc_return(&device_num));
821

822
	child_device_obj->device.bus = &hv_bus;
823
	child_device_obj->device.parent = &hv_acpi_dev->dev;
824
	child_device_obj->device.release = vmbus_device_release;
825

826 827 828 829
	/*
	 * Register with the LDM. This will kick off the driver/device
	 * binding...which will eventually call vmbus_match() and vmbus_probe()
	 */
830
	ret = device_register(&child_device_obj->device);
831 832

	if (ret)
833
		pr_err("Unable to register child device\n");
834
	else
835
		pr_debug("child device %s registered\n",
836
			dev_name(&child_device_obj->device));
837 838 839 840

	return ret;
}

841
/*
842
 * vmbus_device_unregister - Remove the specified child device
843
 * from the vmbus.
844
 */
845
void vmbus_device_unregister(struct hv_device *device_obj)
846
{
847 848 849
	pr_debug("child device %s unregistered\n",
		dev_name(&device_obj->device));

850 851 852 853
	/*
	 * Kick off the process of unregistering the device.
	 * This will call vmbus_remove() and eventually vmbus_device_release()
	 */
854
	device_unregister(&device_obj->device);
855 856 857
}


858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879
/*
 * VMBUS is an acpi enumerated device. Get the the IRQ information
 * from DSDT.
 */

static acpi_status vmbus_walk_resources(struct acpi_resource *res, void *irq)
{

	if (res->type == ACPI_RESOURCE_TYPE_IRQ) {
		struct acpi_resource_irq *irqp;
		irqp = &res->data.irq;

		*((unsigned int *)irq) = irqp->interrupts[0];
	}

	return AE_OK;
}

static int vmbus_acpi_add(struct acpi_device *device)
{
	acpi_status result;

880 881
	hv_acpi_dev = device;

882 883
	result = acpi_walk_resources(device->handle, METHOD_NAME__CRS,
					vmbus_walk_resources, &irq);
884 885 886 887 888 889 890 891 892 893 894

	if (ACPI_FAILURE(result)) {
		complete(&probe_event);
		return -ENODEV;
	}
	complete(&probe_event);
	return 0;
}

static const struct acpi_device_id vmbus_acpi_device_ids[] = {
	{"VMBUS", 0},
895
	{"VMBus", 0},
896 897 898 899 900 901 902 903 904 905 906 907
	{"", 0},
};
MODULE_DEVICE_TABLE(acpi, vmbus_acpi_device_ids);

static struct acpi_driver vmbus_acpi_driver = {
	.name = "vmbus",
	.ids = vmbus_acpi_device_ids,
	.ops = {
		.add = vmbus_acpi_add,
	},
};

908
static int __init hv_acpi_init(void)
909
{
910
	int ret, t;
911

912
	if (x86_hyper != &x86_hyper_ms_hyperv)
913 914
		return -ENODEV;

915 916 917 918 919 920
	init_completion(&probe_event);

	/*
	 * Get irq resources first.
	 */

921 922
	ret = acpi_bus_register_driver(&vmbus_acpi_driver);

923 924 925
	if (ret)
		return ret;

926 927 928 929 930
	t = wait_for_completion_timeout(&probe_event, 5*HZ);
	if (t == 0) {
		ret = -ETIMEDOUT;
		goto cleanup;
	}
931 932

	if (irq <= 0) {
933 934
		ret = -ENODEV;
		goto cleanup;
935 936
	}

937 938
	ret = vmbus_bus_init(irq);
	if (ret)
939 940 941 942 943 944
		goto cleanup;

	return 0;

cleanup:
	acpi_bus_unregister_driver(&vmbus_acpi_driver);
945
	hv_acpi_dev = NULL;
946
	return ret;
947 948
}

949 950
static void __exit vmbus_exit(void)
{
951
	hv_remove_vmbus_irq(irq, hv_acpi_dev);
952 953 954 955 956 957
	vmbus_free_channels();
	bus_unregister(&hv_bus);
	hv_cleanup();
	acpi_bus_unregister_driver(&vmbus_acpi_driver);
}

958

959
MODULE_LICENSE("GPL");
960

961
subsys_initcall(hv_acpi_init);
962
module_exit(vmbus_exit);