xprt.c 32.9 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12
/*
 *  linux/net/sunrpc/xprt.c
 *
 *  This is a generic RPC call interface supporting congestion avoidance,
 *  and asynchronous calls.
 *
 *  The interface works like this:
 *
 *  -	When a process places a call, it allocates a request slot if
 *	one is available. Otherwise, it sleeps on the backlog queue
 *	(xprt_reserve).
 *  -	Next, the caller puts together the RPC message, stuffs it into
 *	the request struct, and calls xprt_transmit().
 *  -	xprt_transmit sends the message and installs the caller on the
 *	transport's wait list. At the same time, if a reply is expected,
 *	it installs a timer that is run after the packet's timeout has
 *	expired.
 *  -	When a packet arrives, the data_ready handler walks the list of
 *	pending requests for that transport. If a matching XID is found, the
 *	caller is woken up, and the timer removed.
 *  -	When no reply arrives within the timeout interval, the timer is
 *	fired by the kernel and runs xprt_timer(). It either adjusts the
 *	timeout values (minor timeout) or wakes up the caller with a status
 *	of -ETIMEDOUT.
 *  -	When the caller receives a notification from RPC that a reply arrived,
 *	it should release the RPC slot, and process the reply.
 *	If the call timed out, it may choose to retry the operation by
 *	adjusting the initial timeout value, and simply calling rpc_call
 *	again.
 *
 *  Support for async RPC is done through a set of RPC-specific scheduling
 *  primitives that `transparently' work for processes as well as async
 *  tasks that rely on callbacks.
 *
 *  Copyright (C) 1995-1997, Olaf Kirch <okir@monad.swb.de>
 *
 *  Transport switch API copyright (C) 2005, Chuck Lever <cel@netapp.com>
 */

40 41
#include <linux/module.h>

L
Linus Torvalds 已提交
42
#include <linux/types.h>
43
#include <linux/interrupt.h>
L
Linus Torvalds 已提交
44
#include <linux/workqueue.h>
45
#include <linux/net.h>
46
#include <linux/ktime.h>
L
Linus Torvalds 已提交
47

48
#include <linux/sunrpc/clnt.h>
49
#include <linux/sunrpc/metrics.h>
50
#include <linux/sunrpc/bc_xprt.h>
L
Linus Torvalds 已提交
51

52 53
#include "sunrpc.h"

L
Linus Torvalds 已提交
54 55 56 57 58 59 60 61 62 63 64
/*
 * Local variables
 */

#ifdef RPC_DEBUG
# define RPCDBG_FACILITY	RPCDBG_XPRT
#endif

/*
 * Local functions
 */
static void	 xprt_init(struct rpc_xprt *xprt, struct net *net);
static void	xprt_request_init(struct rpc_task *, struct rpc_xprt *);
static void	xprt_connect_status(struct rpc_task *task);
static int      __xprt_get_cong(struct rpc_xprt *, struct rpc_task *);

/*
 * List of registered transport classes (struct xprt_class, linked via
 * their "list" member).  All walks and updates of xprt_list in this file
 * are done with xprt_list_lock held.
 */
static DEFINE_SPINLOCK(xprt_list_lock);
static LIST_HEAD(xprt_list);

73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89
/*
 * The transport code maintains an estimate on the maximum number of out-
 * standing RPC requests, using a smoothed version of the congestion
 * avoidance implemented in 44BSD. This is basically the Van Jacobson
 * congestion algorithm: If a retransmit occurs, the congestion window is
 * halved; otherwise, it is incremented by 1/cwnd when
 *
 *	-	a reply is received and
 *	-	a full number of requests are outstanding and
 *	-	the congestion window hasn't been updated recently.
 *
 * The window is kept in fixed point: each request that holds a congestion
 * slot accounts for RPC_CWNDSCALE units of xprt->cong.
 */
/* Number of fractional bits in the fixed-point congestion window. */
#define RPC_CWNDSHIFT		(8U)
/* Fixed-point weight of a single outstanding request. */
#define RPC_CWNDSCALE		(1U << RPC_CWNDSHIFT)
/* Initial window: room for exactly one request. */
#define RPC_INITCWND		RPC_CWNDSCALE
/* Upper bound for the window: max_reqs requests, in fixed point. */
#define RPC_MAXCWND(xprt)	((xprt)->max_reqs << RPC_CWNDSHIFT)

/* True when the outstanding load has reached the congestion window. */
#define RPCXPRT_CONGESTED(xprt) ((xprt)->cong >= (xprt)->cwnd)
L
Linus Torvalds 已提交
90

91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
/**
 * xprt_register_transport - register a transport implementation
 * @transport: transport to register
 *
 * If a transport implementation is loaded as a kernel module, it can
 * call this interface to make itself known to the RPC client.
 *
 * A transport class is considered a duplicate when an already registered
 * class has the same ->ident value.
 *
 * Returns:
 * 0:		transport successfully registered
 * -EEXIST:	transport already registered
 */
int xprt_register_transport(struct xprt_class *transport)
{
	struct xprt_class *t;
	int result;

	result = -EEXIST;
	spin_lock(&xprt_list_lock);
	list_for_each_entry(t, &xprt_list, list) {
		/* don't register the same transport class twice */
		if (t->ident == transport->ident)
			goto out;
	}

	list_add_tail(&transport->list, &xprt_list);
	printk(KERN_INFO "RPC: Registered %s transport module.\n",
	       transport->name);
	result = 0;

out:
	spin_unlock(&xprt_list_lock);
	return result;
}
EXPORT_SYMBOL_GPL(xprt_register_transport);

/**
 * xprt_unregister_transport - unregister a transport implementation
 * @transport: transport to unregister
 *
 * The class is matched by pointer identity against the entries of the
 * registered transport list.
 *
 * Returns:
 * 0:		transport successfully unregistered
 * -ENOENT:	transport never registered
 */
int xprt_unregister_transport(struct xprt_class *transport)
{
	struct xprt_class *t;
	int result;

	result = 0;
	spin_lock(&xprt_list_lock);
	list_for_each_entry(t, &xprt_list, list) {
		if (t == transport) {
			printk(KERN_INFO
				"RPC: Unregistered %s transport module.\n",
				transport->name);
			list_del_init(&transport->list);
			goto out;
		}
	}
	result = -ENOENT;

out:
	spin_unlock(&xprt_list_lock);
	return result;
}
EXPORT_SYMBOL_GPL(xprt_unregister_transport);

159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180
/**
 * xprt_load_transport - load a transport implementation
 * @transport_name: transport to load
 *
 * If a transport class with a matching name is already registered,
 * nothing is loaded.  Otherwise the module "xprt<transport_name>" is
 * requested.
 *
 * Returns:
 * 0:		transport already registered
 * otherwise:	the value returned by request_module()
 */
int xprt_load_transport(const char *transport_name)
{
	struct xprt_class *t;
	int result;

	result = 0;
	spin_lock(&xprt_list_lock);
	list_for_each_entry(t, &xprt_list, list) {
		if (strcmp(t->name, transport_name) == 0) {
			spin_unlock(&xprt_list_lock);
			goto out;
		}
	}
	/* Drop the list lock before asking for the module. */
	spin_unlock(&xprt_list_lock);
	result = request_module("xprt%s", transport_name);
out:
	return result;
}
EXPORT_SYMBOL_GPL(xprt_load_transport);

187 188 189
/**
 * xprt_reserve_xprt - serialize write access to transports
 * @task: task that is requesting access to the transport
190
 * @xprt: pointer to the target transport
191 192 193 194 195
 *
 * This prevents mixing the payload of separate requests, and prevents
 * transport connects from colliding with writes.  No congestion control
 * is provided.
 */
196
int xprt_reserve_xprt(struct rpc_xprt *xprt, struct rpc_task *task)
197 198
{
	struct rpc_rqst *req = task->tk_rqstp;
199
	int priority;
200 201 202 203 204 205 206

	if (test_and_set_bit(XPRT_LOCKED, &xprt->state)) {
		if (task == xprt->snd_task)
			return 1;
		goto out_sleep;
	}
	xprt->snd_task = task;
207 208 209 210
	if (req != NULL) {
		req->rq_bytes_sent = 0;
		req->rq_ntrans++;
	}
211

212 213 214
	return 1;

out_sleep:
215
	dprintk("RPC: %5u failed to lock transport %p\n",
216 217 218
			task->tk_pid, xprt);
	task->tk_timeout = 0;
	task->tk_status = -EAGAIN;
219 220 221 222
	if (req == NULL)
		priority = RPC_PRIORITY_LOW;
	else if (!req->rq_ntrans)
		priority = RPC_PRIORITY_NORMAL;
223
	else
224 225
		priority = RPC_PRIORITY_HIGH;
	rpc_sleep_on_priority(&xprt->sending, task, NULL, priority);
226 227
	return 0;
}
228
EXPORT_SYMBOL_GPL(xprt_reserve_xprt);
229

230 231 232 233 234 235 236 237
static void xprt_clear_locked(struct rpc_xprt *xprt)
{
	xprt->snd_task = NULL;
	if (!test_bit(XPRT_CLOSE_WAIT, &xprt->state) || xprt->shutdown) {
		smp_mb__before_clear_bit();
		clear_bit(XPRT_LOCKED, &xprt->state);
		smp_mb__after_clear_bit();
	} else
238
		queue_work(rpciod_workqueue, &xprt->task_cleanup);
239 240
}

L
Linus Torvalds 已提交
241
/*
242 243 244 245 246 247
 * xprt_reserve_xprt_cong - serialize write access to transports
 * @task: task that is requesting access to the transport
 *
 * Same as xprt_reserve_xprt, but Van Jacobson congestion control is
 * integrated into the decision of whether a request is allowed to be
 * woken up and given access to the transport.
L
Linus Torvalds 已提交
248
 */
249
int xprt_reserve_xprt_cong(struct rpc_xprt *xprt, struct rpc_task *task)
L
Linus Torvalds 已提交
250 251
{
	struct rpc_rqst *req = task->tk_rqstp;
252
	int priority;
L
Linus Torvalds 已提交
253

254
	if (test_and_set_bit(XPRT_LOCKED, &xprt->state)) {
L
Linus Torvalds 已提交
255 256 257 258
		if (task == xprt->snd_task)
			return 1;
		goto out_sleep;
	}
259 260 261 262
	if (req == NULL) {
		xprt->snd_task = task;
		return 1;
	}
263
	if (__xprt_get_cong(xprt, task)) {
L
Linus Torvalds 已提交
264
		xprt->snd_task = task;
265 266
		req->rq_bytes_sent = 0;
		req->rq_ntrans++;
L
Linus Torvalds 已提交
267 268
		return 1;
	}
269
	xprt_clear_locked(xprt);
L
Linus Torvalds 已提交
270
out_sleep:
271
	dprintk("RPC: %5u failed to lock transport %p\n", task->tk_pid, xprt);
L
Linus Torvalds 已提交
272 273
	task->tk_timeout = 0;
	task->tk_status = -EAGAIN;
274 275 276 277
	if (req == NULL)
		priority = RPC_PRIORITY_LOW;
	else if (!req->rq_ntrans)
		priority = RPC_PRIORITY_NORMAL;
L
Linus Torvalds 已提交
278
	else
279 280
		priority = RPC_PRIORITY_HIGH;
	rpc_sleep_on_priority(&xprt->sending, task, NULL, priority);
L
Linus Torvalds 已提交
281 282
	return 0;
}
283
EXPORT_SYMBOL_GPL(xprt_reserve_xprt_cong);
L
Linus Torvalds 已提交
284

285
static inline int xprt_lock_write(struct rpc_xprt *xprt, struct rpc_task *task)
L
Linus Torvalds 已提交
286 287 288
{
	int retval;

C
Chuck Lever 已提交
289
	spin_lock_bh(&xprt->transport_lock);
290
	retval = xprt->ops->reserve_xprt(xprt, task);
C
Chuck Lever 已提交
291
	spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
292 293 294
	return retval;
}

295
static void __xprt_lock_write_next(struct rpc_xprt *xprt)
296 297 298 299 300 301 302
{
	struct rpc_task *task;
	struct rpc_rqst *req;

	if (test_and_set_bit(XPRT_LOCKED, &xprt->state))
		return;

303 304 305
	task = rpc_wake_up_next(&xprt->sending);
	if (task == NULL)
		goto out_unlock;
306 307 308 309 310 311 312 313 314 315

	req = task->tk_rqstp;
	xprt->snd_task = task;
	if (req) {
		req->rq_bytes_sent = 0;
		req->rq_ntrans++;
	}
	return;

out_unlock:
316
	xprt_clear_locked(xprt);
317 318 319
}

static void __xprt_lock_write_next_cong(struct rpc_xprt *xprt)
L
Linus Torvalds 已提交
320 321
{
	struct rpc_task *task;
322
	struct rpc_rqst *req;
L
Linus Torvalds 已提交
323

324
	if (test_and_set_bit(XPRT_LOCKED, &xprt->state))
L
Linus Torvalds 已提交
325
		return;
326
	if (RPCXPRT_CONGESTED(xprt))
L
Linus Torvalds 已提交
327
		goto out_unlock;
328 329 330
	task = rpc_wake_up_next(&xprt->sending);
	if (task == NULL)
		goto out_unlock;
331 332 333 334 335 336

	req = task->tk_rqstp;
	if (req == NULL) {
		xprt->snd_task = task;
		return;
	}
337
	if (__xprt_get_cong(xprt, task)) {
L
Linus Torvalds 已提交
338
		xprt->snd_task = task;
339 340
		req->rq_bytes_sent = 0;
		req->rq_ntrans++;
L
Linus Torvalds 已提交
341 342 343
		return;
	}
out_unlock:
344
	xprt_clear_locked(xprt);
L
Linus Torvalds 已提交
345 346
}

347 348 349 350 351 352
/**
 * xprt_release_xprt - allow other requests to use a transport
 * @xprt: transport with other tasks potentially waiting
 * @task: task that is releasing access to the transport
 *
 * Note that "task" can be NULL.  No congestion control is provided.
L
Linus Torvalds 已提交
353
 */
354
void xprt_release_xprt(struct rpc_xprt *xprt, struct rpc_task *task)
L
Linus Torvalds 已提交
355 356
{
	if (xprt->snd_task == task) {
357
		xprt_clear_locked(xprt);
L
Linus Torvalds 已提交
358 359 360
		__xprt_lock_write_next(xprt);
	}
}
361
EXPORT_SYMBOL_GPL(xprt_release_xprt);
L
Linus Torvalds 已提交
362

363 364 365 366 367 368 369 370 371 372 373
/**
 * xprt_release_xprt_cong - allow other requests to use a transport
 * @xprt: transport with other tasks potentially waiting
 * @task: task that is releasing access to the transport
 *
 * Note that "task" can be NULL.  Another task is awoken to use the
 * transport if the transport's congestion window allows it.
 *
 * Nothing happens unless @task is the current owner (xprt->snd_task).
 */
void xprt_release_xprt_cong(struct rpc_xprt *xprt, struct rpc_task *task)
{
	if (xprt->snd_task == task) {
		xprt_clear_locked(xprt);
		__xprt_lock_write_next_cong(xprt);
	}
}
EXPORT_SYMBOL_GPL(xprt_release_xprt_cong);
379 380

static inline void xprt_release_write(struct rpc_xprt *xprt, struct rpc_task *task)
L
Linus Torvalds 已提交
381
{
C
Chuck Lever 已提交
382
	spin_lock_bh(&xprt->transport_lock);
383
	xprt->ops->release_xprt(xprt, task);
C
Chuck Lever 已提交
384
	spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
385 386 387 388 389 390 391 392 393 394 395 396 397
}

/*
 * Van Jacobson congestion avoidance. Check if the congestion window
 * overflowed.
 *
 * Returns 1 if the task's request already holds a congestion slot or one
 * could be taken (xprt->cong is then raised by RPC_CWNDSCALE), and 0 if
 * the transport is congested.  This function does not itself put the
 * task to sleep; that is left to the caller.
 */
static int
__xprt_get_cong(struct rpc_xprt *xprt, struct rpc_task *task)
{
	struct rpc_rqst *req = task->tk_rqstp;

	if (req->rq_cong)
		return 1;
	dprintk("RPC: %5u xprt_cwnd_limited cong = %lu cwnd = %lu\n",
			task->tk_pid, xprt->cong, xprt->cwnd);
	if (RPCXPRT_CONGESTED(xprt))
		return 0;
	req->rq_cong = 1;
	xprt->cong += RPC_CWNDSCALE;
	return 1;
}

/*
 * Give back the congestion slot held by @req (if any), and wake up the
 * next task that has been sleeping due to congestion
 */
static void
__xprt_put_cong(struct rpc_xprt *xprt, struct rpc_rqst *req)
{
	if (!req->rq_cong)
		return;
	req->rq_cong = 0;
	xprt->cong -= RPC_CWNDSCALE;
	__xprt_lock_write_next_cong(xprt);
}

421 422 423 424 425 426 427 428 429 430
/**
 * xprt_release_rqst_cong - housekeeping when request is complete
 * @task: RPC request that recently completed
 *
 * Useful for transports that require congestion control.  Releases the
 * congestion slot held by the task's request, if it holds one.
 */
void xprt_release_rqst_cong(struct rpc_task *task)
{
	__xprt_put_cong(task->tk_xprt, task->tk_rqstp);
}
EXPORT_SYMBOL_GPL(xprt_release_rqst_cong);
432

433 434 435 436 437
/**
 * xprt_adjust_cwnd - adjust transport congestion window
 * @task: recently completed RPC request used to adjust window
 * @result: result code of completed RPC request
 *
L
Linus Torvalds 已提交
438 439
 * We use a time-smoothed congestion estimator to avoid heavy oscillation.
 */
440
void xprt_adjust_cwnd(struct rpc_task *task, int result)
L
Linus Torvalds 已提交
441
{
442 443 444
	struct rpc_rqst *req = task->tk_rqstp;
	struct rpc_xprt *xprt = task->tk_xprt;
	unsigned long cwnd = xprt->cwnd;
L
Linus Torvalds 已提交
445 446 447 448 449 450 451

	if (result >= 0 && cwnd <= xprt->cong) {
		/* The (cwnd >> 1) term makes sure
		 * the result gets rounded properly. */
		cwnd += (RPC_CWNDSCALE * RPC_CWNDSCALE + (cwnd >> 1)) / cwnd;
		if (cwnd > RPC_MAXCWND(xprt))
			cwnd = RPC_MAXCWND(xprt);
452
		__xprt_lock_write_next_cong(xprt);
L
Linus Torvalds 已提交
453 454 455 456 457
	} else if (result == -ETIMEDOUT) {
		cwnd >>= 1;
		if (cwnd < RPC_CWNDSCALE)
			cwnd = RPC_CWNDSCALE;
	}
458
	dprintk("RPC:       cong %ld, cwnd was %ld, now %ld\n",
L
Linus Torvalds 已提交
459 460
			xprt->cong, xprt->cwnd, cwnd);
	xprt->cwnd = cwnd;
461
	__xprt_put_cong(xprt, req);
L
Linus Torvalds 已提交
462
}
463
EXPORT_SYMBOL_GPL(xprt_adjust_cwnd);
L
Linus Torvalds 已提交
464

465 466 467 468 469 470 471 472 473 474 475 476 477
/**
 * xprt_wake_pending_tasks - wake all tasks on a transport's pending queue
 * @xprt: transport with waiting tasks
 * @status: result code to plant in each task before waking it
 *
 * A negative @status is passed on via rpc_wake_up_status(); for any
 * other value the tasks are woken with plain rpc_wake_up().
 */
void xprt_wake_pending_tasks(struct rpc_xprt *xprt, int status)
{
	if (status < 0)
		rpc_wake_up_status(&xprt->pending, status);
	else
		rpc_wake_up(&xprt->pending);
}
EXPORT_SYMBOL_GPL(xprt_wake_pending_tasks);
479

480 481 482
/**
 * xprt_wait_for_buffer_space - wait for transport output buffer to clear
 * @task: task to be put to sleep
R
Randy Dunlap 已提交
483
 * @action: function pointer to be executed after wait
484
 */
485
void xprt_wait_for_buffer_space(struct rpc_task *task, rpc_action action)
486 487 488 489 490
{
	struct rpc_rqst *req = task->tk_rqstp;
	struct rpc_xprt *xprt = req->rq_xprt;

	task->tk_timeout = req->rq_timeout;
491
	rpc_sleep_on(&xprt->pending, task, action);
492
}
493
EXPORT_SYMBOL_GPL(xprt_wait_for_buffer_space);
494 495 496 497 498 499 500 501 502 503 504 505 506 507

/**
 * xprt_write_space - wake the task waiting for transport output buffer space
 * @xprt: transport with waiting tasks
 *
 * Can be called in a soft IRQ context, so xprt_write_space never sleeps.
 *
 * Only the current write-lock owner (xprt->snd_task) is woken, and
 * nothing is done once the transport is shutting down.
 */
void xprt_write_space(struct rpc_xprt *xprt)
{
	if (unlikely(xprt->shutdown))
		return;

	spin_lock_bh(&xprt->transport_lock);
	if (xprt->snd_task) {
		dprintk("RPC:       write space: waking waiting task on "
				"xprt %p\n", xprt);
		rpc_wake_up_queued_task(&xprt->pending, xprt->snd_task);
	}
	spin_unlock_bh(&xprt->transport_lock);
}
EXPORT_SYMBOL_GPL(xprt_write_space);
515

516 517 518 519 520 521 522 523 524 525 526 527
/**
 * xprt_set_retrans_timeout_def - set a request's retransmit timeout
 * @task: task whose timeout is to be set
 *
 * Set a request's retransmit timeout based on the transport's
 * default timeout parameters.  Used by transports that don't adjust
 * the retransmit timeout based on round-trip time estimation.
 */
void xprt_set_retrans_timeout_def(struct rpc_task *task)
{
	task->tk_timeout = task->tk_rqstp->rq_timeout;
}
EXPORT_SYMBOL_GPL(xprt_set_retrans_timeout_def);
529 530 531 532

/*
 * xprt_set_retrans_timeout_rtt - set a request's retransmit timeout
 * @task: task whose timeout is to be set
533
 *
534 535 536 537 538
 * Set a request's retransmit timeout using the RTT estimator.
 */
void xprt_set_retrans_timeout_rtt(struct rpc_task *task)
{
	int timer = task->tk_msg.rpc_proc->p_timer;
539 540
	struct rpc_clnt *clnt = task->tk_client;
	struct rpc_rtt *rtt = clnt->cl_rtt;
541
	struct rpc_rqst *req = task->tk_rqstp;
542
	unsigned long max_timeout = clnt->cl_timeout->to_maxval;
543 544 545 546 547 548

	task->tk_timeout = rpc_calc_rto(rtt, timer);
	task->tk_timeout <<= rpc_ntimeo(rtt, timer) + req->rq_retries;
	if (task->tk_timeout > max_timeout || task->tk_timeout == 0)
		task->tk_timeout = max_timeout;
}
549
EXPORT_SYMBOL_GPL(xprt_set_retrans_timeout_rtt);
550

L
Linus Torvalds 已提交
551 552
static void xprt_reset_majortimeo(struct rpc_rqst *req)
{
553
	const struct rpc_timeout *to = req->rq_task->tk_client->cl_timeout;
L
Linus Torvalds 已提交
554 555 556 557 558 559 560 561 562 563 564

	req->rq_majortimeo = req->rq_timeout;
	if (to->to_exponential)
		req->rq_majortimeo <<= to->to_retries;
	else
		req->rq_majortimeo += to->to_increment * to->to_retries;
	if (req->rq_majortimeo > to->to_maxval || req->rq_majortimeo == 0)
		req->rq_majortimeo = to->to_maxval;
	req->rq_majortimeo += jiffies;
}

565 566 567 568
/**
 * xprt_adjust_timeout - adjust timeout values for next retransmit
 * @req: RPC request containing parameters to use for the adjustment
 *
L
Linus Torvalds 已提交
569 570 571 572
 */
int xprt_adjust_timeout(struct rpc_rqst *req)
{
	struct rpc_xprt *xprt = req->rq_xprt;
573
	const struct rpc_timeout *to = req->rq_task->tk_client->cl_timeout;
L
Linus Torvalds 已提交
574 575 576 577 578 579 580 581 582 583 584 585 586 587 588
	int status = 0;

	if (time_before(jiffies, req->rq_majortimeo)) {
		if (to->to_exponential)
			req->rq_timeout <<= 1;
		else
			req->rq_timeout += to->to_increment;
		if (to->to_maxval && req->rq_timeout >= to->to_maxval)
			req->rq_timeout = to->to_maxval;
		req->rq_retries++;
	} else {
		req->rq_timeout = to->to_initval;
		req->rq_retries = 0;
		xprt_reset_majortimeo(req);
		/* Reset the RTT counters == "slow start" */
C
Chuck Lever 已提交
589
		spin_lock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
590
		rpc_init_rtt(req->rq_task->tk_client->cl_rtt, to->to_initval);
C
Chuck Lever 已提交
591
		spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
592 593 594 595 596 597 598 599 600 601
		status = -ETIMEDOUT;
	}

	if (req->rq_timeout == 0) {
		printk(KERN_WARNING "xprt_adjust_timeout: rq_timeout = 0!\n");
		req->rq_timeout = 5 * HZ;
	}
	return status;
}

602
static void xprt_autoclose(struct work_struct *work)
L
Linus Torvalds 已提交
603
{
604 605
	struct rpc_xprt *xprt =
		container_of(work, struct rpc_xprt, task_cleanup);
L
Linus Torvalds 已提交
606

607
	xprt->ops->close(xprt);
608
	clear_bit(XPRT_CLOSE_WAIT, &xprt->state);
L
Linus Torvalds 已提交
609 610 611
	xprt_release_write(xprt, NULL);
}

612
/**
613
 * xprt_disconnect_done - mark a transport as disconnected
614 615
 * @xprt: transport to flag for disconnect
 *
L
Linus Torvalds 已提交
616
 */
617
void xprt_disconnect_done(struct rpc_xprt *xprt)
L
Linus Torvalds 已提交
618
{
619
	dprintk("RPC:       disconnected transport %p\n", xprt);
C
Chuck Lever 已提交
620
	spin_lock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
621
	xprt_clear_connected(xprt);
622
	xprt_wake_pending_tasks(xprt, -EAGAIN);
C
Chuck Lever 已提交
623
	spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
624
}
625
EXPORT_SYMBOL_GPL(xprt_disconnect_done);
L
Linus Torvalds 已提交
626

627 628 629 630 631 632 633 634 635 636 637 638 639
/**
 * xprt_force_disconnect - force a transport to disconnect
 * @xprt: transport to disconnect
 *
 */
void xprt_force_disconnect(struct rpc_xprt *xprt)
{
	/* Don't race with the test_bit() in xprt_clear_locked() */
	spin_lock_bh(&xprt->transport_lock);
	set_bit(XPRT_CLOSE_WAIT, &xprt->state);
	/* Try to schedule an autoclose RPC call */
	if (test_and_set_bit(XPRT_LOCKED, &xprt->state) == 0)
		queue_work(rpciod_workqueue, &xprt->task_cleanup);
640
	xprt_wake_pending_tasks(xprt, -EAGAIN);
641 642 643
	spin_unlock_bh(&xprt->transport_lock);
}

644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666
/**
 * xprt_conditional_disconnect - force a transport to disconnect
 * @xprt: transport to disconnect
 * @cookie: 'connection cookie'
 *
 * This attempts to break the connection if and only if 'cookie' matches
 * the current transport 'connection cookie'. It ensures that we don't
 * try to break the connection more than once when we need to retransmit
 * a batch of RPC requests.
 *
 */
void xprt_conditional_disconnect(struct rpc_xprt *xprt, unsigned int cookie)
{
	/* Don't race with the test_bit() in xprt_clear_locked() */
	spin_lock_bh(&xprt->transport_lock);
	if (cookie != xprt->connect_cookie)
		goto out;
	if (test_bit(XPRT_CLOSING, &xprt->state) || !xprt_connected(xprt))
		goto out;
	set_bit(XPRT_CLOSE_WAIT, &xprt->state);
	/* Try to schedule an autoclose RPC call */
	if (test_and_set_bit(XPRT_LOCKED, &xprt->state) == 0)
		queue_work(rpciod_workqueue, &xprt->task_cleanup);
667
	xprt_wake_pending_tasks(xprt, -EAGAIN);
668 669 670 671
out:
	spin_unlock_bh(&xprt->transport_lock);
}

L
Linus Torvalds 已提交
672 673 674 675 676
static void
xprt_init_autodisconnect(unsigned long data)
{
	struct rpc_xprt *xprt = (struct rpc_xprt *)data;

C
Chuck Lever 已提交
677
	spin_lock(&xprt->transport_lock);
L
Linus Torvalds 已提交
678 679
	if (!list_empty(&xprt->recv) || xprt->shutdown)
		goto out_abort;
680
	if (test_and_set_bit(XPRT_LOCKED, &xprt->state))
L
Linus Torvalds 已提交
681
		goto out_abort;
C
Chuck Lever 已提交
682
	spin_unlock(&xprt->transport_lock);
683 684
	set_bit(XPRT_CONNECTION_CLOSE, &xprt->state);
	queue_work(rpciod_workqueue, &xprt->task_cleanup);
L
Linus Torvalds 已提交
685 686
	return;
out_abort:
C
Chuck Lever 已提交
687
	spin_unlock(&xprt->transport_lock);
L
Linus Torvalds 已提交
688 689
}

690 691 692
/**
 * xprt_connect - schedule a transport connect operation
 * @task: RPC task that is requesting the connect
L
Linus Torvalds 已提交
693 694 695 696 697 698
 *
 */
void xprt_connect(struct rpc_task *task)
{
	struct rpc_xprt	*xprt = task->tk_xprt;

699
	dprintk("RPC: %5u xprt_connect xprt %p %s connected\n", task->tk_pid,
L
Linus Torvalds 已提交
700 701
			xprt, (xprt_connected(xprt) ? "is" : "is not"));

702
	if (!xprt_bound(xprt)) {
703
		task->tk_status = -EAGAIN;
L
Linus Torvalds 已提交
704 705 706 707
		return;
	}
	if (!xprt_lock_write(xprt, task))
		return;
708 709 710 711

	if (test_and_clear_bit(XPRT_CLOSE_WAIT, &xprt->state))
		xprt->ops->close(xprt);

L
Linus Torvalds 已提交
712
	if (xprt_connected(xprt))
713 714 715 716
		xprt_release_write(xprt, task);
	else {
		if (task->tk_rqstp)
			task->tk_rqstp->rq_bytes_sent = 0;
L
Linus Torvalds 已提交
717

718
		task->tk_timeout = task->tk_rqstp->rq_timeout;
719
		rpc_sleep_on(&xprt->pending, task, xprt_connect_status);
720 721 722 723 724

		if (test_bit(XPRT_CLOSING, &xprt->state))
			return;
		if (xprt_test_and_set_connecting(xprt))
			return;
725
		xprt->stat.connect_start = jiffies;
726
		xprt->ops->connect(task);
L
Linus Torvalds 已提交
727 728 729
	}
}

730
static void xprt_connect_status(struct rpc_task *task)
L
Linus Torvalds 已提交
731 732 733
{
	struct rpc_xprt	*xprt = task->tk_xprt;

734
	if (task->tk_status == 0) {
735 736
		xprt->stat.connect_count++;
		xprt->stat.connect_time += (long)jiffies - xprt->stat.connect_start;
737
		dprintk("RPC: %5u xprt_connect_status: connection established\n",
L
Linus Torvalds 已提交
738 739 740 741 742
				task->tk_pid);
		return;
	}

	switch (task->tk_status) {
743 744
	case -EAGAIN:
		dprintk("RPC: %5u xprt_connect_status: retrying\n", task->tk_pid);
745
		break;
L
Linus Torvalds 已提交
746
	case -ETIMEDOUT:
747 748
		dprintk("RPC: %5u xprt_connect_status: connect attempt timed "
				"out\n", task->tk_pid);
L
Linus Torvalds 已提交
749 750
		break;
	default:
751 752 753
		dprintk("RPC: %5u xprt_connect_status: error %d connecting to "
				"server %s\n", task->tk_pid, -task->tk_status,
				task->tk_client->cl_server);
754 755
		xprt_release_write(xprt, task);
		task->tk_status = -EIO;
L
Linus Torvalds 已提交
756 757 758
	}
}

759 760 761 762 763
/**
 * xprt_lookup_rqst - find an RPC request corresponding to an XID
 * @xprt: transport on which the original request was transmitted
 * @xid: RPC XID of incoming reply
 *
L
Linus Torvalds 已提交
764
 */
765
struct rpc_rqst *xprt_lookup_rqst(struct rpc_xprt *xprt, __be32 xid)
L
Linus Torvalds 已提交
766
{
767
	struct rpc_rqst *entry;
L
Linus Torvalds 已提交
768

769
	list_for_each_entry(entry, &xprt->recv, rq_list)
770 771
		if (entry->rq_xid == xid)
			return entry;
772 773 774

	dprintk("RPC:       xprt_lookup_rqst did not find xid %08x\n",
			ntohl(xid));
775 776
	xprt->stat.bad_xids++;
	return NULL;
L
Linus Torvalds 已提交
777
}
778
EXPORT_SYMBOL_GPL(xprt_lookup_rqst);
L
Linus Torvalds 已提交
779

780
static void xprt_update_rtt(struct rpc_task *task)
781 782 783 784
{
	struct rpc_rqst *req = task->tk_rqstp;
	struct rpc_rtt *rtt = task->tk_client->cl_rtt;
	unsigned timer = task->tk_msg.rpc_proc->p_timer;
785
	long m = usecs_to_jiffies(ktime_to_us(req->rq_rtt));
786 787 788

	if (timer) {
		if (req->rq_ntrans == 1)
789
			rpc_update_rtt(rtt, timer, m);
790 791 792 793
		rpc_set_timeo(rtt, timer, req->rq_ntrans - 1);
	}
}

794 795
/**
 * xprt_complete_rqst - called when reply processing is complete
796
 * @task: RPC request that recently completed
797 798
 * @copied: actual number of bytes received from the transport
 *
799
 * Caller holds transport lock.
L
Linus Torvalds 已提交
800
 */
801
void xprt_complete_rqst(struct rpc_task *task, int copied)
L
Linus Torvalds 已提交
802
{
803
	struct rpc_rqst *req = task->tk_rqstp;
804
	struct rpc_xprt *xprt = req->rq_xprt;
L
Linus Torvalds 已提交
805

806 807
	dprintk("RPC: %5u xid %08x complete (%d bytes received)\n",
			task->tk_pid, ntohl(req->rq_xid), copied);
L
Linus Torvalds 已提交
808

809
	xprt->stat.recvs++;
810
	req->rq_rtt = ktime_sub(ktime_get(), req->rq_xtime);
811 812
	if (xprt->ops->timer != NULL)
		xprt_update_rtt(task);
813

L
Linus Torvalds 已提交
814
	list_del_init(&req->rq_list);
815
	req->rq_private_buf.len = copied;
816 817
	/* Ensure all writes are done before we update */
	/* req->rq_reply_bytes_recvd */
818
	smp_wmb();
819
	req->rq_reply_bytes_recvd = copied;
820
	rpc_wake_up_queued_task(&xprt->pending, task);
L
Linus Torvalds 已提交
821
}
822
EXPORT_SYMBOL_GPL(xprt_complete_rqst);
L
Linus Torvalds 已提交
823

824
static void xprt_timer(struct rpc_task *task)
L
Linus Torvalds 已提交
825
{
826
	struct rpc_rqst *req = task->tk_rqstp;
L
Linus Torvalds 已提交
827 828
	struct rpc_xprt *xprt = req->rq_xprt;

829 830
	if (task->tk_status != -ETIMEDOUT)
		return;
831
	dprintk("RPC: %5u xprt_timer\n", task->tk_pid);
L
Linus Torvalds 已提交
832

833
	spin_lock_bh(&xprt->transport_lock);
834
	if (!req->rq_reply_bytes_recvd) {
835 836
		if (xprt->ops->timer)
			xprt->ops->timer(task);
837 838 839
	} else
		task->tk_status = 0;
	spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
840 841
}

842 843 844 845 846
/* Returns 1 if the transport has a non-zero idle timeout, else 0. */
static inline int xprt_has_timer(struct rpc_xprt *xprt)
{
	if (xprt->idle_timeout == 0)
		return 0;
	return 1;
}

847 848 849 850
/**
 * xprt_prepare_transmit - reserve the transport before sending a request
 * @task: RPC task about to send a request
 *
L
Linus Torvalds 已提交
851
 */
852
int xprt_prepare_transmit(struct rpc_task *task)
L
Linus Torvalds 已提交
853 854 855 856 857
{
	struct rpc_rqst	*req = task->tk_rqstp;
	struct rpc_xprt	*xprt = req->rq_xprt;
	int err = 0;

858
	dprintk("RPC: %5u xprt_prepare_transmit\n", task->tk_pid);
L
Linus Torvalds 已提交
859

C
Chuck Lever 已提交
860
	spin_lock_bh(&xprt->transport_lock);
861 862
	if (req->rq_reply_bytes_recvd && !req->rq_bytes_sent) {
		err = req->rq_reply_bytes_recvd;
L
Linus Torvalds 已提交
863 864
		goto out_unlock;
	}
865
	if (!xprt->ops->reserve_xprt(xprt, task))
L
Linus Torvalds 已提交
866 867
		err = -EAGAIN;
out_unlock:
C
Chuck Lever 已提交
868
	spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
869 870 871
	return err;
}

872
void xprt_end_transmit(struct rpc_task *task)
873
{
874
	xprt_release_write(task->tk_rqstp->rq_xprt, task);
875 876
}

877 878 879 880 881 882 883
/**
 * xprt_transmit - send an RPC request on a transport
 * @task: controlling RPC task
 *
 * We have to copy the iovec because sendmsg fiddles with its contents.
 */
void xprt_transmit(struct rpc_task *task)
L
Linus Torvalds 已提交
884 885 886
{
	struct rpc_rqst	*req = task->tk_rqstp;
	struct rpc_xprt	*xprt = req->rq_xprt;
887
	int status;
L
Linus Torvalds 已提交
888

889
	dprintk("RPC: %5u xprt_transmit(%u)\n", task->tk_pid, req->rq_slen);
L
Linus Torvalds 已提交
890

891
	if (!req->rq_reply_bytes_recvd) {
892 893 894 895
		if (list_empty(&req->rq_list) && rpc_reply_expected(task)) {
			/*
			 * Add to the list only if we're expecting a reply
			 */
C
Chuck Lever 已提交
896
			spin_lock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
897 898 899 900 901
			/* Update the softirq receive buffer */
			memcpy(&req->rq_private_buf, &req->rq_rcv_buf,
					sizeof(req->rq_private_buf));
			/* Add request to the receive list */
			list_add_tail(&req->rq_list, &xprt->recv);
C
Chuck Lever 已提交
902
			spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
903
			xprt_reset_majortimeo(req);
904 905
			/* Turn off autodisconnect */
			del_singleshot_timer_sync(&xprt->timer);
L
Linus Torvalds 已提交
906 907 908 909
		}
	} else if (!req->rq_bytes_sent)
		return;

910
	req->rq_connect_cookie = xprt->connect_cookie;
911
	req->rq_xtime = ktime_get();
912
	status = xprt->ops->send_request(task);
913 914 915 916
	if (status != 0) {
		task->tk_status = status;
		return;
	}
917

918
	dprintk("RPC: %5u xmit complete\n", task->tk_pid);
919
	task->tk_flags |= RPC_TASK_SENT;
920
	spin_lock_bh(&xprt->transport_lock);
921

922
	xprt->ops->set_retrans_timeout(task);
923

924 925 926
	xprt->stat.sends++;
	xprt->stat.req_u += xprt->stat.sends - xprt->stat.recvs;
	xprt->stat.bklog_u += xprt->backlog.qlen;
L
Linus Torvalds 已提交
927

928 929 930
	/* Don't race with disconnect */
	if (!xprt_connected(xprt))
		task->tk_status = -ENOTCONN;
931
	else if (!req->rq_reply_bytes_recvd && rpc_reply_expected(task)) {
932 933 934 935
		/*
		 * Sleep on the pending queue since
		 * we're expecting a reply.
		 */
936
		rpc_sleep_on(&xprt->pending, task, xprt_timer);
937
	}
938
	spin_unlock_bh(&xprt->transport_lock);
L
Linus Torvalds 已提交
939 940
}

941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964
/*
 * Allocate one additional request slot beyond those on the free list.
 *
 * Returns the zeroed slot on success, ERR_PTR(-EAGAIN) when num_reqs has
 * already reached max_reqs, or ERR_PTR(-ENOMEM) when kzalloc() fails.
 */
static struct rpc_rqst *xprt_dynamic_alloc_slot(struct rpc_xprt *xprt, gfp_t gfp_flags)
{
	struct rpc_rqst *slot;

	/* Account for the new slot first; refuse once the cap is reached. */
	if (!atomic_add_unless(&xprt->num_reqs, 1, xprt->max_reqs))
		return ERR_PTR(-EAGAIN);

	slot = kzalloc(sizeof(*slot), gfp_flags);
	if (slot == NULL) {
		/* Give back the count taken above. */
		atomic_dec(&xprt->num_reqs);
		return ERR_PTR(-ENOMEM);
	}
	return slot;
}

/*
 * Try to hand a request slot back to the allocator.
 *
 * The slot is freed, and true returned, only if num_reqs can be
 * decremented without it being equal to min_reqs beforehand. Otherwise
 * the slot is left untouched and false is returned.
 */
static bool xprt_dynamic_free_slot(struct rpc_xprt *xprt, struct rpc_rqst *req)
{
	if (!atomic_add_unless(&xprt->num_reqs, -1, xprt->min_reqs))
		return false;

	kfree(req);
	return true;
}

965
static void xprt_alloc_slot(struct rpc_task *task)
L
Linus Torvalds 已提交
966 967
{
	struct rpc_xprt	*xprt = task->tk_xprt;
968
	struct rpc_rqst *req;
L
Linus Torvalds 已提交
969 970

	if (!list_empty(&xprt->free)) {
971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986
		req = list_entry(xprt->free.next, struct rpc_rqst, rq_list);
		list_del(&req->rq_list);
		goto out_init_req;
	}
	req = xprt_dynamic_alloc_slot(xprt, GFP_NOWAIT);
	if (!IS_ERR(req))
		goto out_init_req;
	switch (PTR_ERR(req)) {
	case -ENOMEM:
		rpc_delay(task, HZ >> 2);
		dprintk("RPC:       dynamic allocation of request slot "
				"failed! Retrying\n");
		break;
	case -EAGAIN:
		rpc_sleep_on(&xprt->backlog, task, NULL);
		dprintk("RPC:       waiting for request slot\n");
L
Linus Torvalds 已提交
987 988
	}
	task->tk_status = -EAGAIN;
989 990 991 992 993
	return;
out_init_req:
	task->tk_status = 0;
	task->tk_rqstp = req;
	xprt_request_init(task, xprt);
L
Linus Torvalds 已提交
994 995
}

996 997 998
static void xprt_free_slot(struct rpc_xprt *xprt, struct rpc_rqst *req)
{
	spin_lock(&xprt->reserve_lock);
999 1000 1001 1002
	if (!xprt_dynamic_free_slot(xprt, req)) {
		memset(req, 0, sizeof(*req));	/* mark unused */
		list_add(&req->rq_list, &xprt->free);
	}
1003 1004 1005 1006
	rpc_wake_up_next(&xprt->backlog);
	spin_unlock(&xprt->reserve_lock);
}

1007 1008 1009 1010 1011 1012 1013 1014 1015 1016
/*
 * Unlink and kfree() every request slot currently on the transport's
 * free list.
 */
static void xprt_free_all_slots(struct rpc_xprt *xprt)
{
	struct rpc_rqst *slot;

	for (;;) {
		if (list_empty(&xprt->free))
			break;
		slot = list_first_entry(&xprt->free, struct rpc_rqst, rq_list);
		list_del(&slot->rq_list);
		kfree(slot);
	}
}

1017 1018 1019
/**
 * xprt_alloc - allocate a transport and preallocate its request slots
 * @net: network namespace passed on to xprt_init()
 * @size: number of bytes to allocate for the transport structure
 * @num_prealloc: number of request slots to allocate up front
 * @max_alloc: requested upper bound on the number of request slots
 *
 * The slot limits are set so that min_reqs == @num_prealloc and
 * max_reqs is the larger of @max_alloc and @num_prealloc.
 *
 * Returns the new transport, or NULL if any allocation failed.
 */
struct rpc_xprt *xprt_alloc(struct net *net, size_t size,
		unsigned int num_prealloc,
		unsigned int max_alloc)
{
	struct rpc_xprt *xprt;
	struct rpc_rqst *req;
	unsigned int i;	/* same type as the bound it is compared against */

	xprt = kzalloc(size, GFP_KERNEL);
	if (xprt == NULL)
		goto out;

	xprt_init(xprt, net);

	for (i = 0; i < num_prealloc; i++) {
		req = kzalloc(sizeof(struct rpc_rqst), GFP_KERNEL);
		if (!req)
			break;
		list_add(&req->rq_list, &xprt->free);
	}
	/* The loop stopped early: a slot allocation failed. */
	if (i < num_prealloc)
		goto out_free;

	if (max_alloc > num_prealloc)
		xprt->max_reqs = max_alloc;
	else
		xprt->max_reqs = num_prealloc;
	xprt->min_reqs = num_prealloc;
	atomic_set(&xprt->num_reqs, num_prealloc);

	return xprt;

out_free:
	/* xprt_free() also releases the slots already queued on the free list. */
	xprt_free(xprt);
out:
	return NULL;
}
EXPORT_SYMBOL_GPL(xprt_alloc);

1055 1056
void xprt_free(struct rpc_xprt *xprt)
{
P
Pavel Emelyanov 已提交
1057
	put_net(xprt->xprt_net);
1058
	xprt_free_all_slots(xprt);
1059 1060 1061 1062
	kfree(xprt);
}
EXPORT_SYMBOL_GPL(xprt_free);

1063 1064 1065 1066 1067 1068 1069 1070
/**
 * xprt_reserve - allocate an RPC request slot
 * @task: RPC task requesting a slot allocation
 *
 * If no more slots are available, place the task on the transport's
 * backlog queue.
 */
void xprt_reserve(struct rpc_task *task)
L
Linus Torvalds 已提交
1071 1072 1073
{
	struct rpc_xprt	*xprt = task->tk_xprt;

1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087
	task->tk_status = 0;
	if (task->tk_rqstp != NULL)
		return;

	/* Note: grabbing the xprt_lock_write() here is not strictly needed,
	 * but ensures that we throttle new slot allocation if the transport
	 * is congested (e.g. if reconnecting or if we're out of socket
	 * write buffer space).
	 */
	task->tk_timeout = 0;
	task->tk_status = -EAGAIN;
	if (!xprt_lock_write(xprt, task))
		return;

1088
	spin_lock(&xprt->reserve_lock);
1089
	xprt_alloc_slot(task);
1090
	spin_unlock(&xprt->reserve_lock);
1091
	xprt_release_write(xprt, task);
L
Linus Torvalds 已提交
1092 1093
}

1094
static inline __be32 xprt_alloc_xid(struct rpc_xprt *xprt)
L
Linus Torvalds 已提交
1095
{
1096
	return (__force __be32)xprt->xid++;
L
Linus Torvalds 已提交
1097 1098 1099 1100
}

static inline void xprt_init_xid(struct rpc_xprt *xprt)
{
1101
	xprt->xid = net_random();
L
Linus Torvalds 已提交
1102 1103
}

1104
static void xprt_request_init(struct rpc_task *task, struct rpc_xprt *xprt)
L
Linus Torvalds 已提交
1105 1106 1107
{
	struct rpc_rqst	*req = task->tk_rqstp;

1108
	INIT_LIST_HEAD(&req->rq_list);
1109
	req->rq_timeout = task->tk_client->cl_timeout->to_initval;
L
Linus Torvalds 已提交
1110 1111
	req->rq_task	= task;
	req->rq_xprt    = xprt;
1112
	req->rq_buffer  = NULL;
L
Linus Torvalds 已提交
1113
	req->rq_xid     = xprt_alloc_xid(xprt);
1114
	req->rq_release_snd_buf = NULL;
1115
	xprt_reset_majortimeo(req);
1116
	dprintk("RPC: %5u reserved req %p xid %08x\n", task->tk_pid,
L
Linus Torvalds 已提交
1117 1118 1119
			req, ntohl(req->rq_xid));
}

1120 1121 1122 1123
/**
 * xprt_release - release an RPC request slot
 * @task: task which is finished with the slot
 *
L
Linus Torvalds 已提交
1124
 */
1125
void xprt_release(struct rpc_task *task)
L
Linus Torvalds 已提交
1126
{
1127
	struct rpc_xprt	*xprt;
L
Linus Torvalds 已提交
1128 1129 1130 1131
	struct rpc_rqst	*req;

	if (!(req = task->tk_rqstp))
		return;
1132 1133

	xprt = req->rq_xprt;
1134
	rpc_count_iostats(task);
C
Chuck Lever 已提交
1135
	spin_lock_bh(&xprt->transport_lock);
1136
	xprt->ops->release_xprt(xprt, task);
1137 1138
	if (xprt->ops->release_request)
		xprt->ops->release_request(task);
L
Linus Torvalds 已提交
1139 1140 1141
	if (!list_empty(&req->rq_list))
		list_del(&req->rq_list);
	xprt->last_used = jiffies;
1142
	if (list_empty(&xprt->recv) && xprt_has_timer(xprt))
1143
		mod_timer(&xprt->timer,
1144
				xprt->last_used + xprt->idle_timeout);
C
Chuck Lever 已提交
1145
	spin_unlock_bh(&xprt->transport_lock);
1146
	if (req->rq_buffer)
1147
		xprt->ops->buf_free(req->rq_buffer);
1148 1149
	if (req->rq_cred != NULL)
		put_rpccred(req->rq_cred);
L
Linus Torvalds 已提交
1150
	task->tk_rqstp = NULL;
1151 1152
	if (req->rq_release_snd_buf)
		req->rq_release_snd_buf(req);
1153

1154
	dprintk("RPC: %5u release request %p\n", task->tk_pid, req);
1155 1156 1157
	if (likely(!bc_prealloc(req)))
		xprt_free_slot(xprt, req);
	else
1158
		xprt_free_bc_request(req);
L
Linus Torvalds 已提交
1159 1160
}

1161
static void xprt_init(struct rpc_xprt *xprt, struct net *net)
1162
{
1163
	atomic_set(&xprt->count, 1);
1164 1165 1166 1167 1168 1169

	spin_lock_init(&xprt->transport_lock);
	spin_lock_init(&xprt->reserve_lock);

	INIT_LIST_HEAD(&xprt->free);
	INIT_LIST_HEAD(&xprt->recv);
1170
#if defined(CONFIG_SUNRPC_BACKCHANNEL)
1171 1172
	spin_lock_init(&xprt->bc_pa_lock);
	INIT_LIST_HEAD(&xprt->bc_pa_list);
1173
#endif /* CONFIG_SUNRPC_BACKCHANNEL */
1174

1175 1176
	xprt->last_used = jiffies;
	xprt->cwnd = RPC_INITCWND;
1177
	xprt->bind_index = 0;
1178 1179 1180

	rpc_init_wait_queue(&xprt->binding, "xprt_binding");
	rpc_init_wait_queue(&xprt->pending, "xprt_pending");
1181
	rpc_init_priority_wait_queue(&xprt->sending, "xprt_sending");
1182 1183 1184 1185
	rpc_init_priority_wait_queue(&xprt->backlog, "xprt_backlog");

	xprt_init_xid(xprt);

1186
	xprt->xprt_net = get_net(net);
1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214
}

/**
 * xprt_create_transport - create an RPC transport
 * @args: rpc transport creation arguments
 *
 */
struct rpc_xprt *xprt_create_transport(struct xprt_create *args)
{
	struct rpc_xprt	*xprt;
	struct xprt_class *t;

	spin_lock(&xprt_list_lock);
	list_for_each_entry(t, &xprt_list, list) {
		if (t->ident == args->ident) {
			spin_unlock(&xprt_list_lock);
			goto found;
		}
	}
	spin_unlock(&xprt_list_lock);
	printk(KERN_ERR "RPC: transport (%d) not supported\n", args->ident);
	return ERR_PTR(-EIO);

found:
	xprt = t->setup(args);
	if (IS_ERR(xprt)) {
		dprintk("RPC:       xprt_create_transport: failed, %ld\n",
				-PTR_ERR(xprt));
1215
		goto out;
1216
	}
1217 1218 1219 1220 1221 1222
	INIT_WORK(&xprt->task_cleanup, xprt_autoclose);
	if (xprt_has_timer(xprt))
		setup_timer(&xprt->timer, xprt_init_autodisconnect,
			    (unsigned long)xprt);
	else
		init_timer(&xprt->timer);
1223
	dprintk("RPC:       created transport %p with %u slots\n", xprt,
1224
			xprt->max_reqs);
1225
out:
1226 1227 1228
	return xprt;
}

1229 1230
/**
 * xprt_destroy - destroy an RPC transport, killing off all requests.
1231
 * @xprt: transport to destroy
1232
 *
L
Linus Torvalds 已提交
1233
 */
1234
static void xprt_destroy(struct rpc_xprt *xprt)
L
Linus Torvalds 已提交
1235
{
1236
	dprintk("RPC:       destroying transport %p\n", xprt);
1237 1238
	xprt->shutdown = 1;
	del_timer_sync(&xprt->timer);
1239

1240 1241 1242 1243
	rpc_destroy_wait_queue(&xprt->binding);
	rpc_destroy_wait_queue(&xprt->pending);
	rpc_destroy_wait_queue(&xprt->sending);
	rpc_destroy_wait_queue(&xprt->backlog);
1244
	cancel_work_sync(&xprt->task_cleanup);
1245 1246 1247
	/*
	 * Tear down transport state and free the rpc_xprt
	 */
1248
	xprt->ops->destroy(xprt);
1249
}
L
Linus Torvalds 已提交
1250

1251 1252 1253 1254 1255 1256 1257
/**
 * xprt_put - release a reference to an RPC transport.
 * @xprt: pointer to the transport
 *
 */
void xprt_put(struct rpc_xprt *xprt)
{
1258 1259
	if (atomic_dec_and_test(&xprt->count))
		xprt_destroy(xprt);
1260 1261 1262 1263 1264 1265 1266 1267 1268
}

/**
 * xprt_get - return a reference to an RPC transport.
 * @xprt: pointer to the transport
 *
 */
struct rpc_xprt *xprt_get(struct rpc_xprt *xprt)
{
1269 1270 1271
	if (atomic_inc_not_zero(&xprt->count))
		return xprt;
	return NULL;
L
Linus Torvalds 已提交
1272
}