channel.c 22.4 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20
/*
 * Copyright (c) 2009, Microsoft Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
 * Place - Suite 330, Boston, MA 02111-1307 USA.
 *
 * Authors:
 *   Haiyang Zhang <haiyangz@microsoft.com>
 *   Hank Janssen  <hjanssen@microsoft.com>
 */
21 22
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

23
#include <linux/kernel.h>
24 25
#include <linux/sched.h>
#include <linux/wait.h>
26
#include <linux/mm.h>
27
#include <linux/slab.h>
28
#include <linux/module.h>
29
#include <linux/hyperv.h>
30

31
#include "hyperv_vmbus.h"
32

K
K. Y. Srinivasan 已提交
33 34 35
/*
 * NUM_PAGES_SPANNED - number of pages spanned by @len bytes starting at
 * @addr.
 *
 * Both arguments are parenthesized so that expression arguments (for
 * example "base | off") expand with the intended precedence.  @addr is
 * evaluated twice; do not pass expressions with side effects.
 */
#define NUM_PAGES_SPANNED(addr, len) \
((PAGE_ALIGN((addr) + (len)) >> PAGE_SHIFT) - ((addr) >> PAGE_SHIFT))

36
/*
37
 * vmbus_setevent- Trigger an event notification on the specified
38
 * channel.
39
 */
40
static void vmbus_setevent(struct vmbus_channel *channel)
41
{
42
	struct hv_monitor_page *monitorpage;
43

44
	if (channel->offermsg.monitor_allocated) {
45
		/* Each u32 represents 32 channels */
46
		sync_set_bit(channel->offermsg.child_relid & 31,
47
			(unsigned long *) vmbus_connection.send_int_page +
48
			(channel->offermsg.child_relid >> 5));
49

50
		monitorpage = vmbus_connection.monitor_pages;
51
		monitorpage++; /* Get the child to parent monitor page */
52

53
		sync_set_bit(channel->monitor_bit,
54 55
			(unsigned long *)&monitorpage->trigger_group
					[channel->monitor_grp].pending);
56

57
	} else {
58
		vmbus_set_event(channel);
59 60 61
	}
}

62
/*
63
 * vmbus_get_debug_info -Retrieve various channel debug info
64
 */
65
void vmbus_get_debug_info(struct vmbus_channel *channel,
66
			      struct vmbus_channel_debug_info *debuginfo)
67
{
68
	struct hv_monitor_page *monitorpage;
69 70
	u8 monitor_group = (u8)channel->offermsg.monitorid / 32;
	u8 monitor_offset = (u8)channel->offermsg.monitorid % 32;
71

72 73 74
	debuginfo->relid = channel->offermsg.child_relid;
	debuginfo->state = channel->state;
	memcpy(&debuginfo->interfacetype,
75
	       &channel->offermsg.offer.if_type, sizeof(uuid_le));
76
	memcpy(&debuginfo->interface_instance,
77
	       &channel->offermsg.offer.if_instance,
78
	       sizeof(uuid_le));
79

80
	monitorpage = (struct hv_monitor_page *)vmbus_connection.monitor_pages;
81

82
	debuginfo->monitorid = channel->offermsg.monitorid;
83

84
	debuginfo->servermonitor_pending =
85
			monitorpage->trigger_group[monitor_group].pending;
86
	debuginfo->servermonitor_latency =
87
			monitorpage->latency[monitor_group][monitor_offset];
88
	debuginfo->servermonitor_connectionid =
89 90
			monitorpage->parameter[monitor_group]
					[monitor_offset].connectionid.u.id;
91

92
	monitorpage++;
93

94
	debuginfo->clientmonitor_pending =
95
			monitorpage->trigger_group[monitor_group].pending;
96
	debuginfo->clientmonitor_latency =
97
			monitorpage->latency[monitor_group][monitor_offset];
98
	debuginfo->clientmonitor_connectionid =
99 100
			monitorpage->parameter[monitor_group]
					[monitor_offset].connectionid.u.id;
101

102 103
	hv_ringbuffer_get_debuginfo(&channel->inbound, &debuginfo->inbound);
	hv_ringbuffer_get_debuginfo(&channel->outbound, &debuginfo->outbound);
104 105
}

106
/*
107
 * vmbus_open - Open the specified channel.
108
 */
109
int vmbus_open(struct vmbus_channel *newchannel, u32 send_ringbuffer_size,
110 111
		     u32 recv_ringbuffer_size, void *userdata, u32 userdatalen,
		     void (*onchannelcallback)(void *context), void *context)
112
{
113
	struct vmbus_channel_open_channel *open_msg;
114
	struct vmbus_channel_msginfo *open_info = NULL;
115
	void *in, *out;
116
	unsigned long flags;
117
	int ret, t, err = 0;
118

119 120
	newchannel->onchannel_callback = onchannelcallback;
	newchannel->channel_callback_context = context;
121

122
	/* Allocate the ring buffer */
123 124 125
	out = (void *)__get_free_pages(GFP_KERNEL|__GFP_ZERO,
		get_order(send_ringbuffer_size + recv_ringbuffer_size));

126 127 128
	if (!out)
		return -ENOMEM;

129

130
	in = (void *)((unsigned long)out + send_ringbuffer_size);
131

132 133
	newchannel->ringbuffer_pages = out;
	newchannel->ringbuffer_pagecount = (send_ringbuffer_size +
134
					   recv_ringbuffer_size) >> PAGE_SHIFT;
135

136 137 138
	ret = hv_ringbuffer_init(
		&newchannel->outbound, out, send_ringbuffer_size);

139
	if (ret != 0) {
140
		err = ret;
141
		goto error0;
142 143
	}

144 145
	ret = hv_ringbuffer_init(
		&newchannel->inbound, in, recv_ringbuffer_size);
146
	if (ret != 0) {
147
		err = ret;
148
		goto error0;
149
	}
150 151


152
	/* Establish the gpadl for the ring buffer */
153
	newchannel->ringbuffer_gpadlhandle = 0;
154

155
	ret = vmbus_establish_gpadl(newchannel,
156
					 newchannel->outbound.ring_buffer,
157 158
					 send_ringbuffer_size +
					 recv_ringbuffer_size,
159
					 &newchannel->ringbuffer_gpadlhandle);
160

161
	if (ret != 0) {
162
		err = ret;
163
		goto error0;
164
	}
165

166
	/* Create and init the channel open message */
167
	open_info = kmalloc(sizeof(*open_info) +
168 169
			   sizeof(struct vmbus_channel_open_channel),
			   GFP_KERNEL);
170
	if (!open_info) {
171
		err = -ENOMEM;
172
		goto error0;
173
	}
174

175
	init_completion(&open_info->waitevent);
176

177
	open_msg = (struct vmbus_channel_open_channel *)open_info->msg;
178 179 180 181 182
	open_msg->header.msgtype = CHANNELMSG_OPENCHANNEL;
	open_msg->openid = newchannel->offermsg.child_relid;
	open_msg->child_relid = newchannel->offermsg.child_relid;
	open_msg->ringbuffer_gpadlhandle = newchannel->ringbuffer_gpadlhandle;
	open_msg->downstream_ringbuffer_pageoffset = send_ringbuffer_size >>
183
						  PAGE_SHIFT;
184
	open_msg->target_vp = newchannel->target_vp;
185

186
	if (userdatalen > MAX_USER_DEFINED_BYTES) {
187
		err = -EINVAL;
188
		goto error0;
189 190
	}

191
	if (userdatalen)
192
		memcpy(open_msg->userdata, userdata, userdatalen);
193

194
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
195
	list_add_tail(&open_info->msglistentry,
196
		      &vmbus_connection.chn_msg_list);
197
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
198

199
	ret = vmbus_post_msg(open_msg,
200
			       sizeof(struct vmbus_channel_open_channel));
201 202

	if (ret != 0)
203
		goto error1;
204

205
	t = wait_for_completion_timeout(&open_info->waitevent, 5*HZ);
206
	if (t == 0) {
207
		err = -ETIMEDOUT;
208
		goto error1;
209 210
	}

211

212 213
	if (open_info->response.open_result.status)
		err = open_info->response.open_result.status;
214

215
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
216
	list_del(&open_info->msglistentry);
217
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
218

219
	kfree(open_info);
220
	return err;
221

222 223 224 225 226 227
error1:
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
	list_del(&open_info->msglistentry);
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);

error0:
228 229
	free_pages((unsigned long)out,
		get_order(send_ringbuffer_size + recv_ringbuffer_size));
230
	kfree(open_info);
231
	return err;
232
}
233
EXPORT_SYMBOL_GPL(vmbus_open);
234

235
/*
236
 * create_gpadl_header - Creates a gpadl for the specified buffer
237
 */
238
static int create_gpadl_header(void *kbuffer, u32 size,
239 240
					 struct vmbus_channel_msginfo **msginfo,
					 u32 *messagecount)
241 242
{
	int i;
243
	int pagecount;
244
	unsigned long long pfn;
245 246 247 248 249
	struct vmbus_channel_gpadl_header *gpadl_header;
	struct vmbus_channel_gpadl_body *gpadl_body;
	struct vmbus_channel_msginfo *msgheader;
	struct vmbus_channel_msginfo *msgbody = NULL;
	u32 msgsize;
250

251
	int pfnsum, pfncount, pfnleft, pfncurr, pfnsize;
252

253 254
	pagecount = size >> PAGE_SHIFT;
	pfn = virt_to_phys(kbuffer) >> PAGE_SHIFT;
255

256
	/* do we need a gpadl body msg */
257
	pfnsize = MAX_SIZE_CHANNEL_MESSAGE -
258 259
		  sizeof(struct vmbus_channel_gpadl_header) -
		  sizeof(struct gpa_range);
260
	pfncount = pfnsize / sizeof(u64);
261

262
	if (pagecount > pfncount) {
263
		/* we need a gpadl body */
264
		/* fill in the header */
265
		msgsize = sizeof(struct vmbus_channel_msginfo) +
266
			  sizeof(struct vmbus_channel_gpadl_header) +
267 268 269
			  sizeof(struct gpa_range) + pfncount * sizeof(u64);
		msgheader =  kzalloc(msgsize, GFP_KERNEL);
		if (!msgheader)
270
			goto nomem;
271

272 273
		INIT_LIST_HEAD(&msgheader->submsglist);
		msgheader->msgsize = msgsize;
274

275
		gpadl_header = (struct vmbus_channel_gpadl_header *)
276 277 278
			msgheader->msg;
		gpadl_header->rangecount = 1;
		gpadl_header->range_buflen = sizeof(struct gpa_range) +
279
					 pagecount * sizeof(u64);
280 281
		gpadl_header->range[0].byte_offset = 0;
		gpadl_header->range[0].byte_count = size;
282
		for (i = 0; i < pfncount; i++)
283
			gpadl_header->range[0].pfn_array[i] = pfn+i;
284 285
		*msginfo = msgheader;
		*messagecount = 1;
286

287 288
		pfnsum = pfncount;
		pfnleft = pagecount - pfncount;
289

290
		/* how many pfns can we fit */
291
		pfnsize = MAX_SIZE_CHANNEL_MESSAGE -
292
			  sizeof(struct vmbus_channel_gpadl_body);
293
		pfncount = pfnsize / sizeof(u64);
294

295
		/* fill in the body */
296 297 298
		while (pfnleft) {
			if (pfnleft > pfncount)
				pfncurr = pfncount;
299
			else
300
				pfncurr = pfnleft;
301

302
			msgsize = sizeof(struct vmbus_channel_msginfo) +
303
				  sizeof(struct vmbus_channel_gpadl_body) +
304 305
				  pfncurr * sizeof(u64);
			msgbody = kzalloc(msgsize, GFP_KERNEL);
306 307 308 309 310 311 312 313 314 315 316 317 318 319 320

			if (!msgbody) {
				struct vmbus_channel_msginfo *pos = NULL;
				struct vmbus_channel_msginfo *tmp = NULL;
				/*
				 * Free up all the allocated messages.
				 */
				list_for_each_entry_safe(pos, tmp,
					&msgheader->submsglist,
					msglistentry) {

					list_del(&pos->msglistentry);
					kfree(pos);
				}

321
				goto nomem;
322 323
			}

324
			msgbody->msgsize = msgsize;
325 326
			(*messagecount)++;
			gpadl_body =
327
				(struct vmbus_channel_gpadl_body *)msgbody->msg;
328 329 330 331

			/*
			 * Gpadl is u32 and we are using a pointer which could
			 * be 64-bit
332 333
			 * This is governed by the guest/host protocol and
			 * so the hypervisor gurantees that this is ok.
334
			 */
335
			for (i = 0; i < pfncurr; i++)
336
				gpadl_body->pfn[i] = pfn + pfnsum + i;
337

338
			/* add to msg header */
339 340
			list_add_tail(&msgbody->msglistentry,
				      &msgheader->submsglist);
341 342
			pfnsum += pfncurr;
			pfnleft -= pfncurr;
343
		}
344
	} else {
345
		/* everything fits in a header */
346
		msgsize = sizeof(struct vmbus_channel_msginfo) +
347
			  sizeof(struct vmbus_channel_gpadl_header) +
348 349 350
			  sizeof(struct gpa_range) + pagecount * sizeof(u64);
		msgheader = kzalloc(msgsize, GFP_KERNEL);
		if (msgheader == NULL)
351
			goto nomem;
352
		msgheader->msgsize = msgsize;
353 354

		gpadl_header = (struct vmbus_channel_gpadl_header *)
355 356 357
			msgheader->msg;
		gpadl_header->rangecount = 1;
		gpadl_header->range_buflen = sizeof(struct gpa_range) +
358
					 pagecount * sizeof(u64);
359 360
		gpadl_header->range[0].byte_offset = 0;
		gpadl_header->range[0].byte_count = size;
361
		for (i = 0; i < pagecount; i++)
362
			gpadl_header->range[0].pfn_array[i] = pfn+i;
363 364 365

		*msginfo = msgheader;
		*messagecount = 1;
366 367 368
	}

	return 0;
369
nomem:
370 371
	kfree(msgheader);
	kfree(msgbody);
372
	return -ENOMEM;
373 374
}

375
/*
376
 * vmbus_establish_gpadl - Estabish a GPADL for the specified buffer
377
 *
378 379 380 381
 * @channel: a channel
 * @kbuffer: from kmalloc
 * @size: page-size multiple
 * @gpadl_handle: some funky thing
382
 */
383
int vmbus_establish_gpadl(struct vmbus_channel *channel, void *kbuffer,
384
			       u32 size, u32 *gpadl_handle)
385
{
386 387 388 389 390
	struct vmbus_channel_gpadl_header *gpadlmsg;
	struct vmbus_channel_gpadl_body *gpadl_body;
	struct vmbus_channel_msginfo *msginfo = NULL;
	struct vmbus_channel_msginfo *submsginfo;
	u32 msgcount;
391
	struct list_head *curr;
392
	u32 next_gpadl_handle;
393
	unsigned long flags;
394
	int ret = 0;
395
	int t;
396

397 398
	next_gpadl_handle = atomic_read(&vmbus_connection.next_gpadl_handle);
	atomic_inc(&vmbus_connection.next_gpadl_handle);
399

400
	ret = create_gpadl_header(kbuffer, size, &msginfo, &msgcount);
401 402
	if (ret)
		return ret;
403

404
	init_completion(&msginfo->waitevent);
405

406 407 408 409
	gpadlmsg = (struct vmbus_channel_gpadl_header *)msginfo->msg;
	gpadlmsg->header.msgtype = CHANNELMSG_GPADL_HEADER;
	gpadlmsg->child_relid = channel->offermsg.child_relid;
	gpadlmsg->gpadl = next_gpadl_handle;
410 411


412
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
413
	list_add_tail(&msginfo->msglistentry,
414
		      &vmbus_connection.chn_msg_list);
415

416
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
417

418
	ret = vmbus_post_msg(gpadlmsg, msginfo->msgsize -
419
			       sizeof(*msginfo));
420
	if (ret != 0)
421
		goto cleanup;
422

423
	if (msgcount > 1) {
424
		list_for_each(curr, &msginfo->submsglist) {
425

426 427
			submsginfo = (struct vmbus_channel_msginfo *)curr;
			gpadl_body =
428
			     (struct vmbus_channel_gpadl_body *)submsginfo->msg;
429

430 431 432
			gpadl_body->header.msgtype =
				CHANNELMSG_GPADL_BODY;
			gpadl_body->gpadl = next_gpadl_handle;
433

434
			ret = vmbus_post_msg(gpadl_body,
435
					       submsginfo->msgsize -
436
					       sizeof(*submsginfo));
437
			if (ret != 0)
438
				goto cleanup;
439

440 441
		}
	}
442
	t = wait_for_completion_timeout(&msginfo->waitevent, 5*HZ);
443
	BUG_ON(t == 0);
444

445

446
	/* At this point, we received the gpadl created msg */
447
	*gpadl_handle = gpadlmsg->gpadl;
448

449
cleanup:
450
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
451
	list_del(&msginfo->msglistentry);
452
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
453

454
	kfree(msginfo);
455 456
	return ret;
}
457
EXPORT_SYMBOL_GPL(vmbus_establish_gpadl);
458

459
/*
460
 * vmbus_teardown_gpadl -Teardown the specified GPADL handle
461
 */
462
int vmbus_teardown_gpadl(struct vmbus_channel *channel, u32 gpadl_handle)
463
{
464
	struct vmbus_channel_gpadl_teardown *msg;
465
	struct vmbus_channel_msginfo *info;
466
	unsigned long flags;
467
	int ret, t;
468

469 470
	info = kmalloc(sizeof(*info) +
		       sizeof(struct vmbus_channel_gpadl_teardown), GFP_KERNEL);
471 472
	if (!info)
		return -ENOMEM;
473

474
	init_completion(&info->waitevent);
475

476
	msg = (struct vmbus_channel_gpadl_teardown *)info->msg;
477

478 479 480
	msg->header.msgtype = CHANNELMSG_GPADL_TEARDOWN;
	msg->child_relid = channel->offermsg.child_relid;
	msg->gpadl = gpadl_handle;
481

482
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
483
	list_add_tail(&info->msglistentry,
484
		      &vmbus_connection.chn_msg_list);
485
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
486
	ret = vmbus_post_msg(msg,
487
			       sizeof(struct vmbus_channel_gpadl_teardown));
488

489
	BUG_ON(ret != 0);
490
	t = wait_for_completion_timeout(&info->waitevent, 5*HZ);
491
	BUG_ON(t == 0);
492

493
	/* Received a torndown response */
494
	spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
495
	list_del(&info->msglistentry);
496
	spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
497

498
	kfree(info);
499 500
	return ret;
}
501
EXPORT_SYMBOL_GPL(vmbus_teardown_gpadl);
502

503
/*
504
 * vmbus_close - Close the specified channel
505
 */
506
void vmbus_close(struct vmbus_channel *channel)
507
{
508
	struct vmbus_channel_close_channel *msg;
509
	int ret;
510
	unsigned long flags;
511

512
	/* Stop callback and cancel the timer asap */
513
	spin_lock_irqsave(&channel->inbound_lock, flags);
514
	channel->onchannel_callback = NULL;
515
	spin_unlock_irqrestore(&channel->inbound_lock, flags);
516

517
	/* Send a closing message */
518

519
	msg = &channel->close_msg.msg;
520

521 522
	msg->header.msgtype = CHANNELMSG_CLOSECHANNEL;
	msg->child_relid = channel->offermsg.child_relid;
523

524
	ret = vmbus_post_msg(msg, sizeof(struct vmbus_channel_close_channel));
525

526
	BUG_ON(ret != 0);
527
	/* Tear down the gpadl for the channel's ring buffer */
528
	if (channel->ringbuffer_gpadlhandle)
529
		vmbus_teardown_gpadl(channel,
530
					  channel->ringbuffer_gpadlhandle);
531

532
	/* Cleanup the ring buffers for this channel */
533 534
	hv_ringbuffer_cleanup(&channel->outbound);
	hv_ringbuffer_cleanup(&channel->inbound);
535

536 537
	free_pages((unsigned long)channel->ringbuffer_pages,
		get_order(channel->ringbuffer_pagecount * PAGE_SIZE));
538 539 540


}
541
EXPORT_SYMBOL_GPL(vmbus_close);
542

543
/**
544
 * vmbus_sendpacket() - Send the specified buffer on the given channel
545 546 547 548 549
 * @channel: Pointer to vmbus_channel structure.
 * @buffer: Pointer to the buffer you want to receive the data into.
 * @bufferlen: Maximum size of what the the buffer will hold
 * @requestid: Identifier of the request
 * @type: Type of packet that is being send e.g. negotiate, time
550 551
 * packet etc.
 *
552
 * Sends data in @buffer directly to hyper-v via the vmbus
553 554 555
 * This will send the data unparsed to hyper-v.
 *
 * Mainly used by Hyper-V drivers.
556
 */
557
int vmbus_sendpacket(struct vmbus_channel *channel, const void *buffer,
558 559
			   u32 bufferlen, u64 requestid,
			   enum vmbus_packet_type type, u32 flags)
560
{
561
	struct vmpacket_descriptor desc;
562
	u32 packetlen = sizeof(struct vmpacket_descriptor) + bufferlen;
563
	u32 packetlen_aligned = ALIGN(packetlen, sizeof(u64));
564 565
	struct scatterlist bufferlist[3];
	u64 aligned_data = 0;
566
	int ret;
567
	bool signal = false;
568 569


570
	/* Setup the descriptor */
571 572
	desc.type = type; /* VmbusPacketTypeDataInBand; */
	desc.flags = flags; /* VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED; */
573
	/* in 8-bytes granularity */
574 575 576
	desc.offset8 = sizeof(struct vmpacket_descriptor) >> 3;
	desc.len8 = (u16)(packetlen_aligned >> 3);
	desc.trans_id = requestid;
577

578 579 580 581 582
	sg_init_table(bufferlist, 3);
	sg_set_buf(&bufferlist[0], &desc, sizeof(struct vmpacket_descriptor));
	sg_set_buf(&bufferlist[1], buffer, bufferlen);
	sg_set_buf(&bufferlist[2], &aligned_data,
		   packetlen_aligned - packetlen);
583

584
	ret = hv_ringbuffer_write(&channel->outbound, bufferlist, 3, &signal);
585

586
	if (ret == 0 && signal)
587
		vmbus_setevent(channel);
588 589 590

	return ret;
}
591
EXPORT_SYMBOL(vmbus_sendpacket);
592

593
/*
594
 * vmbus_sendpacket_pagebuffer - Send a range of single-page buffer
595
 * packets using a GPADL Direct packet type.
596
 */
597
int vmbus_sendpacket_pagebuffer(struct vmbus_channel *channel,
598 599 600
				     struct hv_page_buffer pagebuffers[],
				     u32 pagecount, void *buffer, u32 bufferlen,
				     u64 requestid)
601
{
602 603
	int ret;
	int i;
604
	struct vmbus_channel_packet_page_buffer desc;
605 606 607 608 609
	u32 descsize;
	u32 packetlen;
	u32 packetlen_aligned;
	struct scatterlist bufferlist[3];
	u64 aligned_data = 0;
610
	bool signal = false;
611

612
	if (pagecount > MAX_PAGE_BUFFER_COUNT)
613
		return -EINVAL;
614 615


616
	/*
617
	 * Adjust the size down since vmbus_channel_packet_page_buffer is the
618 619
	 * largest size we support
	 */
620 621
	descsize = sizeof(struct vmbus_channel_packet_page_buffer) -
			  ((MAX_PAGE_BUFFER_COUNT - pagecount) *
622
			  sizeof(struct hv_page_buffer));
623
	packetlen = descsize + bufferlen;
624
	packetlen_aligned = ALIGN(packetlen, sizeof(u64));
625

626
	/* Setup the descriptor */
627
	desc.type = VM_PKT_DATA_USING_GPA_DIRECT;
628
	desc.flags = VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED;
629 630 631 632 633 634
	desc.dataoffset8 = descsize >> 3; /* in 8-bytes grandularity */
	desc.length8 = (u16)(packetlen_aligned >> 3);
	desc.transactionid = requestid;
	desc.rangecount = pagecount;

	for (i = 0; i < pagecount; i++) {
635 636 637
		desc.range[i].len = pagebuffers[i].len;
		desc.range[i].offset = pagebuffers[i].offset;
		desc.range[i].pfn	 = pagebuffers[i].pfn;
638 639
	}

640 641 642 643 644
	sg_init_table(bufferlist, 3);
	sg_set_buf(&bufferlist[0], &desc, descsize);
	sg_set_buf(&bufferlist[1], buffer, bufferlen);
	sg_set_buf(&bufferlist[2], &aligned_data,
		packetlen_aligned - packetlen);
645

646
	ret = hv_ringbuffer_write(&channel->outbound, bufferlist, 3, &signal);
647

648
	if (ret == 0 && signal)
649
		vmbus_setevent(channel);
650 651 652

	return ret;
}
653
EXPORT_SYMBOL_GPL(vmbus_sendpacket_pagebuffer);
654

655
/*
656
 * vmbus_sendpacket_multipagebuffer - Send a multi-page buffer packet
657
 * using a GPADL Direct packet type.
658
 */
659
int vmbus_sendpacket_multipagebuffer(struct vmbus_channel *channel,
660 661
				struct hv_multipage_buffer *multi_pagebuffer,
				void *buffer, u32 bufferlen, u64 requestid)
662
{
663
	int ret;
664
	struct vmbus_channel_packet_multipage_buffer desc;
665 666 667 668 669
	u32 descsize;
	u32 packetlen;
	u32 packetlen_aligned;
	struct scatterlist bufferlist[3];
	u64 aligned_data = 0;
670
	bool signal = false;
671 672
	u32 pfncount = NUM_PAGES_SPANNED(multi_pagebuffer->offset,
					 multi_pagebuffer->len);
673 674


675
	if ((pfncount < 0) || (pfncount > MAX_MULTIPAGE_BUFFER_COUNT))
676
		return -EINVAL;
677

678
	/*
679
	 * Adjust the size down since vmbus_channel_packet_multipage_buffer is
680 681
	 * the largest size we support
	 */
682 683
	descsize = sizeof(struct vmbus_channel_packet_multipage_buffer) -
			  ((MAX_MULTIPAGE_BUFFER_COUNT - pfncount) *
684
			  sizeof(u64));
685
	packetlen = descsize + bufferlen;
686
	packetlen_aligned = ALIGN(packetlen, sizeof(u64));
687 688


689
	/* Setup the descriptor */
690
	desc.type = VM_PKT_DATA_USING_GPA_DIRECT;
691
	desc.flags = VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED;
692 693 694
	desc.dataoffset8 = descsize >> 3; /* in 8-bytes grandularity */
	desc.length8 = (u16)(packetlen_aligned >> 3);
	desc.transactionid = requestid;
695
	desc.rangecount = 1;
696

697 698
	desc.range.len = multi_pagebuffer->len;
	desc.range.offset = multi_pagebuffer->offset;
699

700
	memcpy(desc.range.pfn_array, multi_pagebuffer->pfn_array,
701
	       pfncount * sizeof(u64));
702

703 704 705 706 707
	sg_init_table(bufferlist, 3);
	sg_set_buf(&bufferlist[0], &desc, descsize);
	sg_set_buf(&bufferlist[1], buffer, bufferlen);
	sg_set_buf(&bufferlist[2], &aligned_data,
		packetlen_aligned - packetlen);
708

709
	ret = hv_ringbuffer_write(&channel->outbound, bufferlist, 3, &signal);
710

711
	if (ret == 0 && signal)
712
		vmbus_setevent(channel);
713 714 715

	return ret;
}
716
EXPORT_SYMBOL_GPL(vmbus_sendpacket_multipagebuffer);
717 718

/**
719
 * vmbus_recvpacket() - Retrieve the user packet on the specified channel
720 721 722 723 724
 * @channel: Pointer to vmbus_channel structure.
 * @buffer: Pointer to the buffer you want to receive the data into.
 * @bufferlen: Maximum size of what the the buffer will hold
 * @buffer_actual_len: The actual size of the data after it was received
 * @requestid: Identifier of the request
725 726 727 728 729
 *
 * Receives directly from the hyper-v vmbus and puts the data it received
 * into Buffer. This will receive the data unparsed from hyper-v.
 *
 * Mainly used by Hyper-V drivers.
730
 */
731
int vmbus_recvpacket(struct vmbus_channel *channel, void *buffer,
732
			u32 bufferlen, u32 *buffer_actual_len, u64 *requestid)
733
{
734
	struct vmpacket_descriptor desc;
735 736
	u32 packetlen;
	u32 userlen;
737
	int ret;
738
	bool signal = false;
739

740 741
	*buffer_actual_len = 0;
	*requestid = 0;
742 743


744
	ret = hv_ringbuffer_peek(&channel->inbound, &desc,
745
			     sizeof(struct vmpacket_descriptor));
746
	if (ret != 0)
747 748
		return 0;

749 750
	packetlen = desc.len8 << 3;
	userlen = packetlen - (desc.offset8 << 3);
751

752
	*buffer_actual_len = userlen;
753

754
	if (userlen > bufferlen) {
755

756
		pr_err("Buffer too small - got %d needs %d\n",
757
			   bufferlen, userlen);
758
		return -ETOOSMALL;
759 760
	}

761
	*requestid = desc.trans_id;
762

763
	/* Copy over the packet to the user buffer */
764
	ret = hv_ringbuffer_read(&channel->inbound, buffer, userlen,
765
			     (desc.offset8 << 3), &signal);
766

767 768
	if (signal)
		vmbus_setevent(channel);
769 770 771

	return 0;
}
772
EXPORT_SYMBOL(vmbus_recvpacket);
773

774
/*
775
 * vmbus_recvpacket_raw - Retrieve the raw packet on the specified channel
776
 */
777
int vmbus_recvpacket_raw(struct vmbus_channel *channel, void *buffer,
778 779
			      u32 bufferlen, u32 *buffer_actual_len,
			      u64 *requestid)
780
{
781
	struct vmpacket_descriptor desc;
782
	u32 packetlen;
783
	int ret;
784
	bool signal = false;
785

786 787
	*buffer_actual_len = 0;
	*requestid = 0;
788 789


790
	ret = hv_ringbuffer_peek(&channel->inbound, &desc,
791
			     sizeof(struct vmpacket_descriptor));
792
	if (ret != 0)
793 794 795
		return 0;


796
	packetlen = desc.len8 << 3;
797

798
	*buffer_actual_len = packetlen;
799

800
	if (packetlen > bufferlen) {
801 802 803
		pr_err("Buffer too small - needed %d bytes but "
			"got space for only %d bytes\n",
			packetlen, bufferlen);
804
		return -ENOBUFS;
805 806
	}

807
	*requestid = desc.trans_id;
808

809
	/* Copy over the entire packet to the user buffer */
810 811 812 813 814
	ret = hv_ringbuffer_read(&channel->inbound, buffer, packetlen, 0,
				 &signal);

	if (signal)
		vmbus_setevent(channel);
815 816 817

	return 0;
}
818
EXPORT_SYMBOL_GPL(vmbus_recvpacket_raw);