/*
 * GPL HEADER START
 *
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 only,
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License version 2 for more details (a copy is included
 * in the LICENSE file that accompanied this code).
 *
 * You should have received a copy of the GNU General Public License
 * version 2 along with this program; If not, see
 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
 *
 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
 * CA 95054 USA or visit www.sun.com if you need additional information or
 * have any questions.
 *
 * GPL HEADER END
 */
/*
 * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
 * Use is subject to license terms.
 *
 * Copyright (c) 2010, 2012, Intel Corporation.
 */
/*
 * This file is part of Lustre, http://www.lustre.org/
 * Lustre is a trademark of Sun Microsystems, Inc.
 *
 * lustre/ldlm/ldlm_lock.c
 *
 * Author: Peter Braam <braam@clusterfs.com>
 * Author: Phil Schwan <phil@clusterfs.com>
 */

#define DEBUG_SUBSYSTEM S_LDLM

#include "../../include/linux/libcfs/libcfs.h"
#include "../include/lustre_intent.h"
#include "../include/obd_class.h"
#include "ldlm_internal.h"

/* lock types */
char *ldlm_lockname[] = {
	[0]		= "--",
	[LCK_EX]	= "EX",
	[LCK_PW]	= "PW",
	[LCK_PR]	= "PR",
	[LCK_CW]	= "CW",
	[LCK_CR]	= "CR",
	[LCK_NL]	= "NL",
	[LCK_GROUP]	= "GROUP",
	[LCK_COS]	= "COS",
};
EXPORT_SYMBOL(ldlm_lockname);

static char *ldlm_typename[] = {
	[LDLM_PLAIN]	= "PLN",
	[LDLM_EXTENT]	= "EXT",
	[LDLM_FLOCK]	= "FLK",
	[LDLM_IBITS]	= "IBT",
};

static ldlm_policy_wire_to_local_t ldlm_policy_wire18_to_local[] = {
	[LDLM_PLAIN - LDLM_MIN_TYPE]	= ldlm_plain_policy_wire_to_local,
	[LDLM_EXTENT - LDLM_MIN_TYPE]	= ldlm_extent_policy_wire_to_local,
	[LDLM_FLOCK - LDLM_MIN_TYPE]	= ldlm_flock_policy_wire18_to_local,
	[LDLM_IBITS - LDLM_MIN_TYPE]	= ldlm_ibits_policy_wire_to_local,
};

static ldlm_policy_wire_to_local_t ldlm_policy_wire21_to_local[] = {
	[LDLM_PLAIN - LDLM_MIN_TYPE]	= ldlm_plain_policy_wire_to_local,
	[LDLM_EXTENT - LDLM_MIN_TYPE]	= ldlm_extent_policy_wire_to_local,
	[LDLM_FLOCK - LDLM_MIN_TYPE]	= ldlm_flock_policy_wire21_to_local,
	[LDLM_IBITS - LDLM_MIN_TYPE]	= ldlm_ibits_policy_wire_to_local,
};

static ldlm_policy_local_to_wire_t ldlm_policy_local_to_wire[] = {
	[LDLM_PLAIN - LDLM_MIN_TYPE]	= ldlm_plain_policy_local_to_wire,
	[LDLM_EXTENT - LDLM_MIN_TYPE]	= ldlm_extent_policy_local_to_wire,
	[LDLM_FLOCK - LDLM_MIN_TYPE]	= ldlm_flock_policy_local_to_wire,
	[LDLM_IBITS - LDLM_MIN_TYPE]	= ldlm_ibits_policy_local_to_wire,
};
/**
 * Converts lock policy from the local format to the on-the-wire lock_desc
 * format.
 */
static void ldlm_convert_policy_to_wire(ldlm_type_t type,
					const ldlm_policy_data_t *lpolicy,
					ldlm_wire_policy_data_t *wpolicy)
{
	ldlm_policy_local_to_wire_t convert;

	convert = ldlm_policy_local_to_wire[type - LDLM_MIN_TYPE];

	convert(lpolicy, wpolicy);
}
/**
 * Converts lock policy from the on-the-wire lock_desc format to the local
 * format.
 */
void ldlm_convert_policy_to_local(struct obd_export *exp, ldlm_type_t type,
				  const ldlm_wire_policy_data_t *wpolicy,
				  ldlm_policy_data_t *lpolicy)
{
	ldlm_policy_wire_to_local_t convert;
	int new_client;

	/* some badness for 2.0.0 clients, but 2.0.0 isn't supported */
	new_client = (exp_connect_flags(exp) & OBD_CONNECT_FULL20) != 0;
	if (new_client)
		convert = ldlm_policy_wire21_to_local[type - LDLM_MIN_TYPE];
	else
		convert = ldlm_policy_wire18_to_local[type - LDLM_MIN_TYPE];

	convert(wpolicy, lpolicy);
}
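
/*
 * Usage sketch (editor's illustration, not part of the upstream file):
 * how the dispatch tables above are meant to be used.  A local inodebits
 * policy is packed for the wire and unpacked again; the function name and
 * the bit value chosen here are illustrative assumptions only.
 */
static inline void ldlm_policy_conversion_sketch(struct obd_export *exp)
{
	ldlm_policy_data_t local = {
		.l_inodebits = { .bits = 1 /* e.g. the LOOKUP bit */ },
	};
	ldlm_wire_policy_data_t wire;

	/* local -> wire, dispatched through ldlm_policy_local_to_wire[] */
	ldlm_convert_policy_to_wire(LDLM_IBITS, &local, &wire);
	/* wire -> local, table picked from the export's connect flags */
	ldlm_convert_policy_to_local(exp, LDLM_IBITS, &wire, &local);
}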

char *ldlm_it2str(int it)
{
	switch (it) {
	case IT_OPEN:
		return "open";
	case IT_CREAT:
		return "creat";
	case (IT_OPEN | IT_CREAT):
		return "open|creat";
	case IT_READDIR:
		return "readdir";
	case IT_GETATTR:
		return "getattr";
	case IT_LOOKUP:
		return "lookup";
	case IT_UNLINK:
		return "unlink";
	case IT_GETXATTR:
		return "getxattr";
	case IT_LAYOUT:
		return "layout";
	default:
		CERROR("Unknown intent %d\n", it);
		return "UNKNOWN";
	}
}
EXPORT_SYMBOL(ldlm_it2str);

/*
 * REFCOUNTED LOCK OBJECTS
 */

/**
 * Get a reference on a lock.
 *
 * Lock refcounts, during creation:
 *   - one special one for allocation, dec'd only once in destroy
 *   - one for being a lock that's in-use
 *   - one for the addref associated with a new lock
 */
struct ldlm_lock *ldlm_lock_get(struct ldlm_lock *lock)
{
	atomic_inc(&lock->l_refc);
	return lock;
}
EXPORT_SYMBOL(ldlm_lock_get);

/**
 * Release lock reference.
 *
 * Also frees the lock if it was the last reference.
 */
void ldlm_lock_put(struct ldlm_lock *lock)
{
	LASSERT(lock->l_resource != LP_POISON);
	LASSERT(atomic_read(&lock->l_refc) > 0);
	if (atomic_dec_and_test(&lock->l_refc)) {
		struct ldlm_resource *res;

		LDLM_DEBUG(lock,
			   "final lock_put on destroyed lock, freeing it.");

		res = lock->l_resource;
		LASSERT(lock->l_flags & LDLM_FL_DESTROYED);
		LASSERT(list_empty(&lock->l_res_link));
		LASSERT(list_empty(&lock->l_pending_chain));

		lprocfs_counter_decr(ldlm_res_to_ns(res)->ns_stats,
				     LDLM_NSS_LOCKS);
		lu_ref_del(&res->lr_reference, "lock", lock);
		ldlm_resource_putref(res);
		lock->l_resource = NULL;
		if (lock->l_export) {
			class_export_lock_put(lock->l_export, lock);
			lock->l_export = NULL;
		}

		kfree(lock->l_lvb_data);

		ldlm_interval_free(ldlm_interval_detach(lock));
		lu_ref_fini(&lock->l_reference);
		OBD_FREE_RCU(lock, sizeof(*lock), &lock->l_handle);
	}
}
EXPORT_SYMBOL(ldlm_lock_put);
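
/*
 * Usage sketch (editor's illustration, not part of the upstream file):
 * the pairing rule for the refcounting above.  Every LDLM_LOCK_GET() must
 * be balanced by an LDLM_LOCK_PUT(); the final put on a destroyed lock is
 * what actually frees it.
 */
static inline void ldlm_refcount_sketch(struct ldlm_lock *lock)
{
	LDLM_LOCK_GET(lock);	/* take an extra reference */
	/* ... use the lock ... */
	LDLM_LOCK_PUT(lock);	/* and drop it again */
}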

/**
 * Removes LDLM lock \a lock from LRU. Assumes LRU is already locked.
 */
int ldlm_lock_remove_from_lru_nolock(struct ldlm_lock *lock)
{
	int rc = 0;

	if (!list_empty(&lock->l_lru)) {
		struct ldlm_namespace *ns = ldlm_lock_to_ns(lock);

		LASSERT(lock->l_resource->lr_type != LDLM_FLOCK);
		list_del_init(&lock->l_lru);
		LASSERT(ns->ns_nr_unused > 0);
		ns->ns_nr_unused--;
		rc = 1;
	}
	return rc;
}

/**
 * Removes LDLM lock \a lock from LRU. Obtains the LRU lock first.
 */
int ldlm_lock_remove_from_lru(struct ldlm_lock *lock)
{
	struct ldlm_namespace *ns = ldlm_lock_to_ns(lock);
	int rc;

	spin_lock(&ns->ns_lock);
	rc = ldlm_lock_remove_from_lru_nolock(lock);
	spin_unlock(&ns->ns_lock);
	return rc;
}

/**
 * Adds LDLM lock \a lock to namespace LRU. Assumes LRU is already locked.
 */
static void ldlm_lock_add_to_lru_nolock(struct ldlm_lock *lock)
{
	struct ldlm_namespace *ns = ldlm_lock_to_ns(lock);

	lock->l_last_used = cfs_time_current();
	LASSERT(list_empty(&lock->l_lru));
	LASSERT(lock->l_resource->lr_type != LDLM_FLOCK);
	list_add_tail(&lock->l_lru, &ns->ns_unused_list);
	if (lock->l_flags & LDLM_FL_SKIPPED)
		lock->l_flags &= ~LDLM_FL_SKIPPED;
	LASSERT(ns->ns_nr_unused >= 0);
	ns->ns_nr_unused++;
}

/**
 * Adds LDLM lock \a lock to namespace LRU. Obtains necessary LRU locks
 * first.
 */
static void ldlm_lock_add_to_lru(struct ldlm_lock *lock)
{
	struct ldlm_namespace *ns = ldlm_lock_to_ns(lock);

	spin_lock(&ns->ns_lock);
	ldlm_lock_add_to_lru_nolock(lock);
	spin_unlock(&ns->ns_lock);
}

/**
 * Moves LDLM lock \a lock that is already in namespace LRU to the tail of
 * the LRU. Performs necessary LRU locking.
 */
static void ldlm_lock_touch_in_lru(struct ldlm_lock *lock)
{
	struct ldlm_namespace *ns = ldlm_lock_to_ns(lock);

	spin_lock(&ns->ns_lock);
	if (!list_empty(&lock->l_lru)) {
		ldlm_lock_remove_from_lru_nolock(lock);
		ldlm_lock_add_to_lru_nolock(lock);
	}
	spin_unlock(&ns->ns_lock);
}

/**
 * Helper to destroy a locked lock.
 *
 * Used by ldlm_lock_destroy and ldlm_lock_destroy_nolock.
 * Must be called with l_lock and lr_lock held.
 *
 * Does not actually free the lock data, but rather marks the lock as
 * destroyed by setting the LDLM_FL_DESTROYED flag in the lock.  Destroys
 * the handle->lock association too, so that the lock can no longer be
 * found, and removes the lock from the LRU list.  Actual lock freeing
 * occurs when the last lock reference goes away.
 *
 * Original comment (of some historical value):
 * This used to have a 'strict' flag, which recovery would use to mark an
 * in-use lock as needing-to-die.  Lest I am ever tempted to put it back, I
 * shall explain why it's gone: with the new hash table scheme, once you call
 * ldlm_lock_destroy, you can never drop your final references on this lock.
 * Because it's not in the hash table anymore.  -phil
 */
static int ldlm_lock_destroy_internal(struct ldlm_lock *lock)
{
	if (lock->l_readers || lock->l_writers) {
		LDLM_ERROR(lock, "lock still has references");
		LBUG();
	}

	if (!list_empty(&lock->l_res_link)) {
		LDLM_ERROR(lock, "lock still on resource");
		LBUG();
	}

	if (lock->l_flags & LDLM_FL_DESTROYED) {
		LASSERT(list_empty(&lock->l_lru));
		return 0;
	}
	lock->l_flags |= LDLM_FL_DESTROYED;

	if (lock->l_export && lock->l_export->exp_lock_hash) {
		/* NB: it's safe to call cfs_hash_del() even if the lock isn't
		 * in exp_lock_hash. */
		/* In the function below, .hs_keycmp resolves to
		 * ldlm_export_lock_keycmp() */
		/* coverity[overrun-buffer-val] */
		cfs_hash_del(lock->l_export->exp_lock_hash,
			     &lock->l_remote_handle, &lock->l_exp_hash);
	}

	ldlm_lock_remove_from_lru(lock);
	class_handle_unhash(&lock->l_handle);

#if 0
	/* Wake anyone waiting for this lock */
	/* FIXME: I should probably add yet another flag, instead of using
	 * l_export to only call this on clients */
	if (lock->l_export)
		class_export_put(lock->l_export);
	lock->l_export = NULL;
	if (lock->l_export && lock->l_completion_ast)
		lock->l_completion_ast(lock, 0);
#endif
	return 1;
}

/**
 * Destroys a LDLM lock \a lock. Performs necessary locking first.
 */
static void ldlm_lock_destroy(struct ldlm_lock *lock)
{
	int first;

	lock_res_and_lock(lock);
	first = ldlm_lock_destroy_internal(lock);
	unlock_res_and_lock(lock);

	/* drop reference from hashtable only for first destroy */
	if (first) {
		lu_ref_del(&lock->l_reference, "hash", lock);
		LDLM_LOCK_RELEASE(lock);
	}
}

/**
 * Destroys a LDLM lock \a lock that is already locked.
 */
void ldlm_lock_destroy_nolock(struct ldlm_lock *lock)
{
	int first;

	first = ldlm_lock_destroy_internal(lock);
	/* drop reference from hashtable only for first destroy */
	if (first) {
		lu_ref_del(&lock->l_reference, "hash", lock);
		LDLM_LOCK_RELEASE(lock);
	}
}

/* this is called by portals_handle2object with the handle lock taken */
static void lock_handle_addref(void *lock)
{
	LDLM_LOCK_GET((struct ldlm_lock *)lock);
}

static void lock_handle_free(void *lock, int size)
{
	LASSERT(size == sizeof(struct ldlm_lock));
	kmem_cache_free(ldlm_lock_slab, lock);
}

static struct portals_handle_ops lock_handle_ops = {
	.hop_addref = lock_handle_addref,
	.hop_free   = lock_handle_free,
};

/**
 * Allocate and initialize a new lock structure.
 *
 * usage: pass in a resource on which you have done ldlm_resource_get();
 *	the new lock will take over the refcount.
 * returns: lock with refcount 2 - one for the current caller and one for remote
 */
static struct ldlm_lock *ldlm_lock_new(struct ldlm_resource *resource)
{
	struct ldlm_lock *lock;

	if (resource == NULL)
		LBUG();

	lock = kmem_cache_alloc(ldlm_lock_slab, GFP_NOFS | __GFP_ZERO);
	if (lock == NULL)
		return NULL;

	spin_lock_init(&lock->l_lock);
	lock->l_resource = resource;
	lu_ref_add(&resource->lr_reference, "lock", lock);

	atomic_set(&lock->l_refc, 2);
	INIT_LIST_HEAD(&lock->l_res_link);
	INIT_LIST_HEAD(&lock->l_lru);
	INIT_LIST_HEAD(&lock->l_pending_chain);
	INIT_LIST_HEAD(&lock->l_bl_ast);
	INIT_LIST_HEAD(&lock->l_cp_ast);
	INIT_LIST_HEAD(&lock->l_rk_ast);
	init_waitqueue_head(&lock->l_waitq);
	lock->l_blocking_lock = NULL;
	INIT_LIST_HEAD(&lock->l_sl_mode);
	INIT_LIST_HEAD(&lock->l_sl_policy);
	INIT_HLIST_NODE(&lock->l_exp_hash);
	INIT_HLIST_NODE(&lock->l_exp_flock_hash);

	lprocfs_counter_incr(ldlm_res_to_ns(resource)->ns_stats,
			     LDLM_NSS_LOCKS);
	INIT_LIST_HEAD(&lock->l_handle.h_link);
	class_handle_hash(&lock->l_handle, &lock_handle_ops);

	lu_ref_init(&lock->l_reference);
	lu_ref_add(&lock->l_reference, "hash", lock);
	lock->l_callback_timeout = 0;

#if LUSTRE_TRACKS_LOCK_EXP_REFS
	INIT_LIST_HEAD(&lock->l_exp_refs_link);
	lock->l_exp_refs_nr = 0;
	lock->l_exp_refs_target = NULL;
#endif
	INIT_LIST_HEAD(&lock->l_exp_list);

	return lock;
}

/**
 * Moves LDLM lock \a lock to another resource.
 * This is used on the client when the server returns a different lock from
 * the one requested (typically as a result of an intent operation).
 */
int ldlm_lock_change_resource(struct ldlm_namespace *ns, struct ldlm_lock *lock,
			      const struct ldlm_res_id *new_resid)
{
	struct ldlm_resource *oldres = lock->l_resource;
	struct ldlm_resource *newres;
	int type;

	lock_res_and_lock(lock);
	if (memcmp(new_resid, &lock->l_resource->lr_name,
		   sizeof(lock->l_resource->lr_name)) == 0) {
		/* Nothing to do */
		unlock_res_and_lock(lock);
		return 0;
	}

	LASSERT(new_resid->name[0] != 0);

	/* This function assumes that the lock isn't on any lists */
	LASSERT(list_empty(&lock->l_res_link));

	type = oldres->lr_type;
	unlock_res_and_lock(lock);

	newres = ldlm_resource_get(ns, NULL, new_resid, type, 1);
	if (newres == NULL)
		return -ENOMEM;

	lu_ref_add(&newres->lr_reference, "lock", lock);
	/*
	 * To flip the lock from the old to the new resource, lock, oldres and
	 * newres have to be locked. Resource spin-locks are nested within
	 * lock->l_lock, and are taken in the memory address order to avoid
	 * dead-locks.
	 */
	spin_lock(&lock->l_lock);
	oldres = lock->l_resource;
	if (oldres < newres) {
		lock_res(oldres);
		lock_res_nested(newres, LRT_NEW);
	} else {
		lock_res(newres);
		lock_res_nested(oldres, LRT_NEW);
	}
	LASSERT(memcmp(new_resid, &oldres->lr_name,
		       sizeof(oldres->lr_name)) != 0);
	lock->l_resource = newres;
	unlock_res(oldres);
	unlock_res_and_lock(lock);

	/* ...and the flowers are still standing! */
	lu_ref_del(&oldres->lr_reference, "lock", lock);
	ldlm_resource_putref(oldres);

	return 0;
}
EXPORT_SYMBOL(ldlm_lock_change_resource);

/** \defgroup ldlm_handles LDLM HANDLES
 * Ways to get hold of locks without any addresses.
 * @{
 */

/**
 * Fills in handle for LDLM lock \a lock into supplied \a lockh.
 * Does not take any references.
 */
void ldlm_lock2handle(const struct ldlm_lock *lock, struct lustre_handle *lockh)
{
	lockh->cookie = lock->l_handle.h_cookie;
}
EXPORT_SYMBOL(ldlm_lock2handle);

/**
 * Obtain a lock reference by handle.
 *
 * If \a flags is nonzero: atomically get the lock and set the flags.
 *	      Returns NULL if any of the flags is already set.
 */
struct ldlm_lock *__ldlm_handle2lock(const struct lustre_handle *handle,
				     __u64 flags)
{
	struct ldlm_lock *lock;

	LASSERT(handle);

	lock = class_handle2object(handle->cookie);
	if (lock == NULL)
		return NULL;

	/* It's unlikely but possible that someone marked the lock as
	 * destroyed after we did handle2object on it */
	if (flags == 0 && ((lock->l_flags & LDLM_FL_DESTROYED) == 0)) {
		lu_ref_add(&lock->l_reference, "handle", current);
		return lock;
	}

	lock_res_and_lock(lock);

	LASSERT(lock->l_resource != NULL);

	lu_ref_add_atomic(&lock->l_reference, "handle", current);
	if (unlikely(lock->l_flags & LDLM_FL_DESTROYED)) {
		unlock_res_and_lock(lock);
		CDEBUG(D_INFO, "lock already destroyed: lock %p\n", lock);
		LDLM_LOCK_PUT(lock);
		return NULL;
	}

	if (flags && (lock->l_flags & flags)) {
		unlock_res_and_lock(lock);
		LDLM_LOCK_PUT(lock);
		return NULL;
	}

	if (flags)
		lock->l_flags |= flags;

	unlock_res_and_lock(lock);
	return lock;
}
EXPORT_SYMBOL(__ldlm_handle2lock);
/** @} ldlm_handles */
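
/*
 * Usage sketch (editor's illustration, not part of the upstream file):
 * the handle round trip.  A lock is flattened into a lustre_handle cookie
 * and later resolved back; handle2lock takes a reference that the caller
 * must drop.
 */
static inline void ldlm_handle_roundtrip_sketch(struct ldlm_lock *lock)
{
	struct lustre_handle lockh;
	struct ldlm_lock *found;

	ldlm_lock2handle(lock, &lockh);		/* takes no reference */
	found = ldlm_handle2lock(&lockh);	/* NULL if destroyed meanwhile */
	if (found)
		LDLM_LOCK_PUT(found);		/* drop the handle2lock ref */
}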

/**
 * Fill in "on the wire" representation for given LDLM lock into supplied
 * lock descriptor \a desc structure.
 */
void ldlm_lock2desc(struct ldlm_lock *lock, struct ldlm_lock_desc *desc)
{
	ldlm_res2desc(lock->l_resource, &desc->l_resource);
	desc->l_req_mode = lock->l_req_mode;
	desc->l_granted_mode = lock->l_granted_mode;
	ldlm_convert_policy_to_wire(lock->l_resource->lr_type,
				    &lock->l_policy_data,
				    &desc->l_policy_data);
}
EXPORT_SYMBOL(ldlm_lock2desc);

/**
 * Add a lock to list of conflicting locks to send AST to.
 *
 * Only add if we have not sent a blocking AST to the lock yet.
 */
static void ldlm_add_bl_work_item(struct ldlm_lock *lock, struct ldlm_lock *new,
				  struct list_head *work_list)
{
	if ((lock->l_flags & LDLM_FL_AST_SENT) == 0) {
		LDLM_DEBUG(lock, "lock incompatible; sending blocking AST.");
		lock->l_flags |= LDLM_FL_AST_SENT;
		/* If the enqueuing client said so, tell the AST recipient to
		 * discard dirty data, rather than writing back. */
		if (new->l_flags & LDLM_FL_AST_DISCARD_DATA)
			lock->l_flags |= LDLM_FL_DISCARD_DATA;
		LASSERT(list_empty(&lock->l_bl_ast));
		list_add(&lock->l_bl_ast, work_list);
		LDLM_LOCK_GET(lock);
		LASSERT(lock->l_blocking_lock == NULL);
		lock->l_blocking_lock = LDLM_LOCK_GET(new);
	}
}

/**
 * Add a lock to list of just granted locks to send completion AST to.
 */
static void ldlm_add_cp_work_item(struct ldlm_lock *lock,
				  struct list_head *work_list)
{
	if ((lock->l_flags & LDLM_FL_CP_REQD) == 0) {
		lock->l_flags |= LDLM_FL_CP_REQD;
		LDLM_DEBUG(lock, "lock granted; sending completion AST.");
		LASSERT(list_empty(&lock->l_cp_ast));
		list_add(&lock->l_cp_ast, work_list);
		LDLM_LOCK_GET(lock);
	}
}

/**
 * Aggregator function to add AST work items into a list. Determines
 * what sort of an AST work needs to be done and calls the proper
 * adding function.
 * Must be called with lr_lock held.
 */
static void ldlm_add_ast_work_item(struct ldlm_lock *lock,
				   struct ldlm_lock *new,
				   struct list_head *work_list)
{
	check_res_locked(lock->l_resource);
	if (new)
		ldlm_add_bl_work_item(lock, new, work_list);
	else
		ldlm_add_cp_work_item(lock, work_list);
}

/**
 * Add specified reader/writer reference to LDLM lock with handle \a lockh.
 * r/w reference type is determined by \a mode
 * Calls ldlm_lock_addref_internal.
 */
void ldlm_lock_addref(struct lustre_handle *lockh, __u32 mode)
{
	struct ldlm_lock *lock;

	lock = ldlm_handle2lock(lockh);
	LASSERT(lock != NULL);
	ldlm_lock_addref_internal(lock, mode);
	LDLM_LOCK_PUT(lock);
}
EXPORT_SYMBOL(ldlm_lock_addref);

/**
 * Helper function.
 * Add specified reader/writer reference to LDLM lock \a lock.
 * r/w reference type is determined by \a mode
 * Removes lock from LRU if it is there.
 * Assumes the LDLM lock is already locked.
 */
void ldlm_lock_addref_internal_nolock(struct ldlm_lock *lock, __u32 mode)
{
	ldlm_lock_remove_from_lru(lock);
	if (mode & (LCK_NL | LCK_CR | LCK_PR)) {
		lock->l_readers++;
		lu_ref_add_atomic(&lock->l_reference, "reader", lock);
	}
	if (mode & (LCK_EX | LCK_CW | LCK_PW | LCK_GROUP | LCK_COS)) {
		lock->l_writers++;
		lu_ref_add_atomic(&lock->l_reference, "writer", lock);
	}
	LDLM_LOCK_GET(lock);
	lu_ref_add_atomic(&lock->l_reference, "user", lock);
	LDLM_DEBUG(lock, "ldlm_lock_addref(%s)", ldlm_lockname[mode]);
}

/**
 * Attempts to add reader/writer reference to a lock with handle \a lockh, and
 * fails if lock is already LDLM_FL_CBPENDING or destroyed.
 *
 * \retval 0 success, lock was addref-ed
 *
 * \retval -EAGAIN lock is being canceled.
 */
int ldlm_lock_addref_try(struct lustre_handle *lockh, __u32 mode)
{
	struct ldlm_lock *lock;
	int	       result;

	result = -EAGAIN;
	lock = ldlm_handle2lock(lockh);
	if (lock != NULL) {
		lock_res_and_lock(lock);
		if (lock->l_readers != 0 || lock->l_writers != 0 ||
		    !(lock->l_flags & LDLM_FL_CBPENDING)) {
			ldlm_lock_addref_internal_nolock(lock, mode);
			result = 0;
		}
		unlock_res_and_lock(lock);
		LDLM_LOCK_PUT(lock);
	}
	return result;
}
EXPORT_SYMBOL(ldlm_lock_addref_try);

/**
 * Add specified reader/writer reference to LDLM lock \a lock.
 * Locks LDLM lock and calls ldlm_lock_addref_internal_nolock to do the work.
 * Only called for local locks.
 */
void ldlm_lock_addref_internal(struct ldlm_lock *lock, __u32 mode)
{
	lock_res_and_lock(lock);
	ldlm_lock_addref_internal_nolock(lock, mode);
	unlock_res_and_lock(lock);
}

/**
 * Removes a reader/writer reference for LDLM lock \a lock.
 * Assumes the LDLM lock is already locked.
 * Only called in ldlm_flock_destroy and for local locks.
 * Does NOT add the lock to the LRU if no r/w references are left, in order
 * to accommodate flock locks that cannot be placed in the LRU.
 */
void ldlm_lock_decref_internal_nolock(struct ldlm_lock *lock, __u32 mode)
{
	LDLM_DEBUG(lock, "ldlm_lock_decref(%s)", ldlm_lockname[mode]);
	if (mode & (LCK_NL | LCK_CR | LCK_PR)) {
		LASSERT(lock->l_readers > 0);
		lu_ref_del(&lock->l_reference, "reader", lock);
		lock->l_readers--;
	}
	if (mode & (LCK_EX | LCK_CW | LCK_PW | LCK_GROUP | LCK_COS)) {
		LASSERT(lock->l_writers > 0);
		lu_ref_del(&lock->l_reference, "writer", lock);
		lock->l_writers--;
	}

	lu_ref_del(&lock->l_reference, "user", lock);
	LDLM_LOCK_RELEASE(lock);    /* matches the LDLM_LOCK_GET() in addref */
}

/**
 * Removes a reader/writer reference for LDLM lock \a lock.
 * Locks the LDLM lock first.
 * If the lock is a client lock and its r/w refcount drops to zero while the
 * lock is not blocked, the lock is added to the LRU of its namespace.
 * For blocked locks, the blocking AST is run once the r/w refcount drops to
 * zero.
 */
void ldlm_lock_decref_internal(struct ldlm_lock *lock, __u32 mode)
{
	struct ldlm_namespace *ns;

	lock_res_and_lock(lock);

	ns = ldlm_lock_to_ns(lock);

	ldlm_lock_decref_internal_nolock(lock, mode);

	if (lock->l_flags & LDLM_FL_LOCAL &&
	    !lock->l_readers && !lock->l_writers) {
		/* If this is a local lock on a server namespace and this was
		 * the last reference, cancel the lock. */
		CDEBUG(D_INFO, "forcing cancel of local lock\n");
		lock->l_flags |= LDLM_FL_CBPENDING;
	}

	if (!lock->l_readers && !lock->l_writers &&
	    (lock->l_flags & LDLM_FL_CBPENDING)) {
		/* If we received a blocking AST and this was the last
		 * reference, run the callback. */

		LDLM_DEBUG(lock, "final decref done on cbpending lock");

		LDLM_LOCK_GET(lock); /* dropped by bl thread */
		ldlm_lock_remove_from_lru(lock);
		unlock_res_and_lock(lock);

		if (lock->l_flags & LDLM_FL_FAIL_LOC)
			OBD_RACE(OBD_FAIL_LDLM_CP_BL_RACE);

		if ((lock->l_flags & LDLM_FL_ATOMIC_CB) ||
		    ldlm_bl_to_thread_lock(ns, NULL, lock) != 0)
			ldlm_handle_bl_callback(ns, NULL, lock);
	} else if (!lock->l_readers && !lock->l_writers &&
		   !(lock->l_flags & LDLM_FL_NO_LRU) &&
		   !(lock->l_flags & LDLM_FL_BL_AST)) {

		LDLM_DEBUG(lock, "add lock into lru list");

		/* If this is a client-side namespace and this was the last
		 * reference, put it on the LRU. */
		ldlm_lock_add_to_lru(lock);
		unlock_res_and_lock(lock);

		if (lock->l_flags & LDLM_FL_FAIL_LOC)
			OBD_RACE(OBD_FAIL_LDLM_CP_BL_RACE);

		/* Call ldlm_cancel_lru() only if EARLY_CANCEL and LRU RESIZE
		 * are not supported by the server, otherwise, it is done on
		 * enqueue. */
		if (!exp_connect_cancelset(lock->l_conn_export) &&
		    !ns_connect_lru_resize(ns))
			ldlm_cancel_lru(ns, 0, LCF_ASYNC, 0);
	} else {
		LDLM_DEBUG(lock, "do not add lock into lru list");
		unlock_res_and_lock(lock);
	}
}

/**
 * Decrease reader/writer refcount for LDLM lock with handle \a lockh
 */
void ldlm_lock_decref(struct lustre_handle *lockh, __u32 mode)
{
	struct ldlm_lock *lock = __ldlm_handle2lock(lockh, 0);

	LASSERTF(lock != NULL, "Non-existing lock: %#llx\n", lockh->cookie);
	ldlm_lock_decref_internal(lock, mode);
	LDLM_LOCK_PUT(lock);
}
EXPORT_SYMBOL(ldlm_lock_decref);
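
/*
 * Usage sketch (editor's illustration, not part of the upstream file):
 * reader/writer referencing through handles.  A reader reference pins the
 * lock out of the LRU until the matching decref, after which a client lock
 * normally returns to the LRU.
 */
static inline void ldlm_ref_by_handle_sketch(struct lustre_handle *lockh)
{
	ldlm_lock_addref(lockh, LCK_PR);	/* take a PR reader reference */
	/* ... access data under the protection of the lock ... */
	ldlm_lock_decref(lockh, LCK_PR);	/* and release it */
}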

/**
 * Decrease reader/writer refcount for LDLM lock with handle
 * \a lockh and mark it for subsequent cancellation once r/w refcount
 * drops to zero instead of putting into LRU.
 *
 * Typical usage is for GROUP locks which we cannot allow to be cached.
 */
void ldlm_lock_decref_and_cancel(struct lustre_handle *lockh, __u32 mode)
{
	struct ldlm_lock *lock = __ldlm_handle2lock(lockh, 0);

	LASSERT(lock != NULL);

	LDLM_DEBUG(lock, "ldlm_lock_decref(%s)", ldlm_lockname[mode]);
	lock_res_and_lock(lock);
	lock->l_flags |= LDLM_FL_CBPENDING;
	unlock_res_and_lock(lock);
	ldlm_lock_decref_internal(lock, mode);
	LDLM_LOCK_PUT(lock);
}
EXPORT_SYMBOL(ldlm_lock_decref_and_cancel);

struct sl_insert_point {
	struct list_head *res_link;
	struct list_head *mode_link;
	struct list_head *policy_link;
};

/**
 * Finds a position to insert the new lock into granted lock list.
 *
 * Used for locks eligible for skiplist optimization.
 *
 * Parameters:
 *      queue [input]:  the granted list where search acts on;
 *      req [input]:    the lock whose position to be located;
 *      prev [output]:  positions within 3 lists to insert @req to
 * Return Value:
 *      filled @prev
 * NOTE: called by
 *  - ldlm_grant_lock_with_skiplist
 */
static void search_granted_lock(struct list_head *queue,
				struct ldlm_lock *req,
				struct sl_insert_point *prev)
{
	struct list_head *tmp;
	struct ldlm_lock *lock, *mode_end, *policy_end;

	list_for_each(tmp, queue) {
		lock = list_entry(tmp, struct ldlm_lock, l_res_link);

		mode_end = list_entry(lock->l_sl_mode.prev,
					  struct ldlm_lock, l_sl_mode);

		if (lock->l_req_mode != req->l_req_mode) {
			/* jump to last lock of mode group */
			tmp = &mode_end->l_res_link;
			continue;
		}

		/* suitable mode group is found */
		if (lock->l_resource->lr_type == LDLM_PLAIN) {
			/* insert point is last lock of the mode group */
			prev->res_link = &mode_end->l_res_link;
			prev->mode_link = &mode_end->l_sl_mode;
			prev->policy_link = &req->l_sl_policy;
			return;
		}

		if (lock->l_resource->lr_type == LDLM_IBITS) {
			for (;;) {
				policy_end =
					list_entry(lock->l_sl_policy.prev,
						       struct ldlm_lock,
						       l_sl_policy);

				if (lock->l_policy_data.l_inodebits.bits ==
				    req->l_policy_data.l_inodebits.bits) {
					/* insert point is last lock of
					 * the policy group */
					prev->res_link =
						&policy_end->l_res_link;
					prev->mode_link =
						&policy_end->l_sl_mode;
					prev->policy_link =
						&policy_end->l_sl_policy;
					return;
				}

				if (policy_end == mode_end)
					/* done with mode group */
					break;

				/* go to next policy group within mode group */
				tmp = policy_end->l_res_link.next;
				lock = list_entry(tmp, struct ldlm_lock,
						      l_res_link);
			}  /* loop over policy groups within the mode group */

			/* insert point is last lock of the mode group,
			 * new policy group is started */
			prev->res_link = &mode_end->l_res_link;
			prev->mode_link = &mode_end->l_sl_mode;
			prev->policy_link = &req->l_sl_policy;
			return;
		}

		LDLM_ERROR(lock, "is not LDLM_PLAIN or LDLM_IBITS lock");
		LBUG();
	}

	/* insert point is last lock on the queue,
	 * new mode group and new policy group are started */
	prev->res_link = queue->prev;
	prev->mode_link = &req->l_sl_mode;
	prev->policy_link = &req->l_sl_policy;
}
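
/*
 * Editor's note (illustrative, not part of the upstream file): the granted
 * list walked above is organized as a skiplist.  Locks with the same mode
 * form a "mode group", and within an IBITS mode group locks with identical
 * inodebits form a "policy group".  l_sl_mode links the first lock of a
 * mode group to its last (l_sl_policy does the same per policy group), so
 * the walk can skip an entire group in one step instead of visiting every
 * lock in it.
 */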

/**
 * Add a lock into resource granted list after a position described by
 * \a prev.
 */
static void ldlm_granted_list_add_lock(struct ldlm_lock *lock,
				       struct sl_insert_point *prev)
{
	struct ldlm_resource *res = lock->l_resource;

	check_res_locked(res);

	ldlm_resource_dump(D_INFO, res);
	LDLM_DEBUG(lock, "About to add lock:");

	if (lock->l_flags & LDLM_FL_DESTROYED) {
		CDEBUG(D_OTHER, "Lock destroyed, not adding to resource\n");
		return;
	}

	LASSERT(list_empty(&lock->l_res_link));
	LASSERT(list_empty(&lock->l_sl_mode));
	LASSERT(list_empty(&lock->l_sl_policy));

	/*
	 * lock->link == prev->link means the lock is the first one in its
	 * group.  Don't re-add it to itself, to suppress kernel warnings.
	 */
	if (&lock->l_res_link != prev->res_link)
		list_add(&lock->l_res_link, prev->res_link);
	if (&lock->l_sl_mode != prev->mode_link)
		list_add(&lock->l_sl_mode, prev->mode_link);
	if (&lock->l_sl_policy != prev->policy_link)
		list_add(&lock->l_sl_policy, prev->policy_link);
}

/**
 * Add a lock to granted list on a resource maintaining skiplist
 * correctness.
 */
static void ldlm_grant_lock_with_skiplist(struct ldlm_lock *lock)
{
	struct sl_insert_point prev;

	LASSERT(lock->l_req_mode == lock->l_granted_mode);

	search_granted_lock(&lock->l_resource->lr_granted, lock, &prev);
	ldlm_granted_list_add_lock(lock, &prev);
}

/**
 * Perform lock granting bookkeeping.
 *
 * Includes putting the lock into granted list and updating lock mode.
 * NOTE: called by
 *  - ldlm_lock_enqueue
 *  - ldlm_reprocess_queue
 *  - ldlm_lock_convert
 *
 * must be called with lr_lock held
 */
void ldlm_grant_lock(struct ldlm_lock *lock, struct list_head *work_list)
{
	struct ldlm_resource *res = lock->l_resource;

	check_res_locked(res);

	lock->l_granted_mode = lock->l_req_mode;
	if (res->lr_type == LDLM_PLAIN || res->lr_type == LDLM_IBITS)
		ldlm_grant_lock_with_skiplist(lock);
	else if (res->lr_type == LDLM_EXTENT)
		ldlm_extent_add_lock(res, lock);
	else
		ldlm_resource_add_lock(res, &res->lr_granted, lock);

	if (lock->l_granted_mode < res->lr_most_restr)
		res->lr_most_restr = lock->l_granted_mode;

	if (work_list && lock->l_completion_ast != NULL)
		ldlm_add_ast_work_item(lock, NULL, work_list);

	ldlm_pool_add(&ldlm_res_to_ns(res)->ns_pool, lock);
}

/**
 * Search for a lock with given properties in a queue.
 *
 * \retval a referenced lock or NULL.  See the flag descriptions below, in the
 * comment above ldlm_lock_match
 */
static struct ldlm_lock *search_queue(struct list_head *queue,
				      ldlm_mode_t *mode,
				      ldlm_policy_data_t *policy,
				      struct ldlm_lock *old_lock,
				      __u64 flags, int unref)
{
	struct ldlm_lock *lock;
	struct list_head       *tmp;

	list_for_each(tmp, queue) {
		ldlm_mode_t match;

		lock = list_entry(tmp, struct ldlm_lock, l_res_link);

		if (lock == old_lock)
			break;

		/* Check if this lock can be matched.
		 * Used by LU-2919 (exclusive open) for the open lease lock */
		if (ldlm_is_excl(lock))
			continue;

		/* llite sometimes wants to match locks that will be
		 * canceled when their users drop, but we allow it to match
		 * if it passes in CBPENDING and the lock still has users.
		 * this is generally only going to be used by children
		 * whose parents already hold a lock so forward progress
		 * can still happen. */
		if (lock->l_flags & LDLM_FL_CBPENDING &&
		    !(flags & LDLM_FL_CBPENDING))
			continue;
		if (!unref && lock->l_flags & LDLM_FL_CBPENDING &&
		    lock->l_readers == 0 && lock->l_writers == 0)
			continue;

		if (!(lock->l_req_mode & *mode))
			continue;
		match = lock->l_req_mode;

		if (lock->l_resource->lr_type == LDLM_EXTENT &&
		    (lock->l_policy_data.l_extent.start >
		     policy->l_extent.start ||
		     lock->l_policy_data.l_extent.end < policy->l_extent.end))
			continue;

		if (unlikely(match == LCK_GROUP) &&
		    lock->l_resource->lr_type == LDLM_EXTENT &&
		    lock->l_policy_data.l_extent.gid != policy->l_extent.gid)
			continue;

		/* We match if we have an existing lock with the same or a
		 * wider set of bits. */
		if (lock->l_resource->lr_type == LDLM_IBITS &&
		     ((lock->l_policy_data.l_inodebits.bits &
		      policy->l_inodebits.bits) !=
		      policy->l_inodebits.bits))
			continue;

		if (!unref && (lock->l_flags & LDLM_FL_GONE_MASK))
			continue;

		if ((flags & LDLM_FL_LOCAL_ONLY) &&
		    !(lock->l_flags & LDLM_FL_LOCAL))
			continue;

		if (flags & LDLM_FL_TEST_LOCK) {
			LDLM_LOCK_GET(lock);
			ldlm_lock_touch_in_lru(lock);
		} else {
			ldlm_lock_addref_internal_nolock(lock, match);
		}
		*mode = match;
		return lock;
	}

	return NULL;
}

void ldlm_lock_fail_match_locked(struct ldlm_lock *lock)
{
	if ((lock->l_flags & LDLM_FL_FAIL_NOTIFIED) == 0) {
		lock->l_flags |= LDLM_FL_FAIL_NOTIFIED;
		wake_up_all(&lock->l_waitq);
	}
}
EXPORT_SYMBOL(ldlm_lock_fail_match_locked);

/**
 * Mark lock as "matchable" by OST.
 *
 * Used to prevent certain races in LOV/OSC where the lock is granted, but LVB
 * is not yet valid.
 * Assumes LDLM lock is already locked.
 */
void ldlm_lock_allow_match_locked(struct ldlm_lock *lock)
{
	lock->l_flags |= LDLM_FL_LVB_READY;
	wake_up_all(&lock->l_waitq);
}
EXPORT_SYMBOL(ldlm_lock_allow_match_locked);

/**
 * Mark lock as "matchable" by OST.
 * Locks the lock and then \see ldlm_lock_allow_match_locked
 */
void ldlm_lock_allow_match(struct ldlm_lock *lock)
{
	lock_res_and_lock(lock);
	ldlm_lock_allow_match_locked(lock);
	unlock_res_and_lock(lock);
}
EXPORT_SYMBOL(ldlm_lock_allow_match);

/**
 * Attempt to find a lock with specified properties.
 *
 * Typically returns a reference to matched lock unless LDLM_FL_TEST_LOCK is
 * set in \a flags
 *
 * Can be called in two ways:
 *
 * If 'ns' is NULL, then lockh describes an existing lock that we want to look
 * for a duplicate of.
 *
 * Otherwise, all of the fields must be filled in, to match against.
 *
 * If 'flags' contains LDLM_FL_LOCAL_ONLY, then only match local locks on the
 *     server (i.e., connh is NULL)
 * If 'flags' contains LDLM_FL_BLOCK_GRANTED, then only locks on the granted
 *     list will be considered
 * If 'flags' contains LDLM_FL_CBPENDING, then locks that have been marked
 *     to be canceled can still be matched as long as they still have reader
 *     or writer references
 * If 'flags' contains LDLM_FL_TEST_LOCK, then don't actually reference a lock,
 *     just tell us if we would have matched.
 *
 * \retval 1 if it finds an already-existing lock that is compatible; in this
 * case, lockh is filled in with an addref()ed lock
 *
 * We also check security context, and if that fails we simply return 0 (to
 * keep caller code unchanged), the context failure will be discovered by
 * caller sometime later.
 */
ldlm_mode_t ldlm_lock_match(struct ldlm_namespace *ns, __u64 flags,
			    const struct ldlm_res_id *res_id, ldlm_type_t type,
			    ldlm_policy_data_t *policy, ldlm_mode_t mode,
			    struct lustre_handle *lockh, int unref)
{
	struct ldlm_resource *res;
	struct ldlm_lock *lock, *old_lock = NULL;
	int rc = 0;

	if (ns == NULL) {
		old_lock = ldlm_handle2lock(lockh);
		LASSERT(old_lock);

		ns = ldlm_lock_to_ns(old_lock);
		res_id = &old_lock->l_resource->lr_name;
		type = old_lock->l_resource->lr_type;
		mode = old_lock->l_req_mode;
	}

	res = ldlm_resource_get(ns, NULL, res_id, type, 0);
	if (res == NULL) {
		LASSERT(old_lock == NULL);
		return 0;
	}

	LDLM_RESOURCE_ADDREF(res);
	lock_res(res);

	lock = search_queue(&res->lr_granted, &mode, policy, old_lock,
			    flags, unref);
	if (lock != NULL) {
		rc = 1;
		goto out;
	}
	if (flags & LDLM_FL_BLOCK_GRANTED) {
		rc = 0;
		goto out;
	}
	lock = search_queue(&res->lr_waiting, &mode, policy, old_lock,
			    flags, unref);
	if (lock != NULL) {
		rc = 1;
		goto out;
	}

 out:
	unlock_res(res);
	LDLM_RESOURCE_DELREF(res);
	ldlm_resource_putref(res);

	if (lock) {
		ldlm_lock2handle(lock, lockh);
		if ((flags & LDLM_FL_LVB_READY) &&
		    (!(lock->l_flags & LDLM_FL_LVB_READY))) {
			__u64 wait_flags = LDLM_FL_LVB_READY |
				LDLM_FL_DESTROYED | LDLM_FL_FAIL_NOTIFIED;
			struct l_wait_info lwi;

			if (lock->l_completion_ast) {
				int err = lock->l_completion_ast(lock,
							  LDLM_FL_WAIT_NOREPROC,
								 NULL);
				if (err) {
					if (flags & LDLM_FL_TEST_LOCK)
						LDLM_LOCK_RELEASE(lock);
					else
						ldlm_lock_decref_internal(lock,
									  mode);
					rc = 0;
					goto out2;
				}
			}

			lwi = LWI_TIMEOUT_INTR(cfs_time_seconds(obd_timeout),
					       NULL, LWI_ON_SIGNAL_NOOP, NULL);

			/* XXX FIXME see comment on CAN_MATCH in lustre_dlm.h */
			l_wait_event(lock->l_waitq,
				     lock->l_flags & wait_flags,
				     &lwi);
			if (!(lock->l_flags & LDLM_FL_LVB_READY)) {
				if (flags & LDLM_FL_TEST_LOCK)
					LDLM_LOCK_RELEASE(lock);
				else
					ldlm_lock_decref_internal(lock, mode);
				rc = 0;
			}
		}
	}
 out2:
	if (rc) {
		LDLM_DEBUG(lock, "matched (%llu %llu)",
			   (type == LDLM_PLAIN || type == LDLM_IBITS) ?
				res_id->name[2] : policy->l_extent.start,
			   (type == LDLM_PLAIN || type == LDLM_IBITS) ?
				res_id->name[3] : policy->l_extent.end);

		/* check user's security context */
		if (lock->l_conn_export &&
		    sptlrpc_import_check_ctx(
				class_exp2cliimp(lock->l_conn_export))) {
			if (!(flags & LDLM_FL_TEST_LOCK))
				ldlm_lock_decref_internal(lock, mode);
			rc = 0;
		}

		if (flags & LDLM_FL_TEST_LOCK)
			LDLM_LOCK_RELEASE(lock);

	} else if (!(flags & LDLM_FL_TEST_LOCK)) { /* less verbose for test-only */
		LDLM_DEBUG_NOLOCK("not matched ns %p type %u mode %u res %llu/%llu (%llu %llu)",
				  ns, type, mode, res_id->name[0],
				  res_id->name[1],
				  (type == LDLM_PLAIN || type == LDLM_IBITS) ?
					res_id->name[2] : policy->l_extent.start,
				  (type == LDLM_PLAIN || type == LDLM_IBITS) ?
					res_id->name[3] : policy->l_extent.end);
	}
	if (old_lock)
		LDLM_LOCK_PUT(old_lock);

	return rc ? mode : 0;
}
EXPORT_SYMBOL(ldlm_lock_match);
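
/*
 * Usage sketch (editor's illustration, not part of the upstream file):
 * a typical client-side match.  The mode and flags shown are one plausible
 * combination; on a hit, the match takes both a lock reference and an r/w
 * reference, which the caller releases with ldlm_lock_decref() when done.
 */
static inline void ldlm_lock_match_sketch(struct ldlm_namespace *ns,
					  const struct ldlm_res_id *res_id,
					  ldlm_policy_data_t *policy)
{
	struct lustre_handle lockh;
	ldlm_mode_t mode;

	mode = ldlm_lock_match(ns, LDLM_FL_BLOCK_GRANTED, res_id, LDLM_IBITS,
			       policy, LCK_PR | LCK_PW, &lockh, 0);
	if (mode != 0)
		ldlm_lock_decref(&lockh, mode);	/* drop the matched refs */
}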

ldlm_mode_t ldlm_revalidate_lock_handle(struct lustre_handle *lockh,
					__u64 *bits)
{
	struct ldlm_lock *lock;
	ldlm_mode_t mode = 0;

	lock = ldlm_handle2lock(lockh);
	if (lock != NULL) {
		lock_res_and_lock(lock);
		if (lock->l_flags & LDLM_FL_GONE_MASK)
			goto out;

		if (lock->l_flags & LDLM_FL_CBPENDING &&
		    lock->l_readers == 0 && lock->l_writers == 0)
			goto out;

		if (bits)
			*bits = lock->l_policy_data.l_inodebits.bits;
		mode = lock->l_granted_mode;
		ldlm_lock_addref_internal_nolock(lock, mode);
	}

out:
	if (lock != NULL) {
		unlock_res_and_lock(lock);
		LDLM_LOCK_PUT(lock);
	}
	return mode;
}
EXPORT_SYMBOL(ldlm_revalidate_lock_handle);

/** The caller must guarantee that the buffer is large enough. */
int ldlm_fill_lvb(struct ldlm_lock *lock, struct req_capsule *pill,
		  enum req_location loc, void *data, int size)
{
	void *lvb;

	LASSERT(data != NULL);
	LASSERT(size >= 0);

	switch (lock->l_lvb_type) {
	case LVB_T_OST:
		if (size == sizeof(struct ost_lvb)) {
			if (loc == RCL_CLIENT)
				lvb = req_capsule_client_swab_get(pill,
						&RMF_DLM_LVB,
						lustre_swab_ost_lvb);
			else
				lvb = req_capsule_server_swab_get(pill,
						&RMF_DLM_LVB,
						lustre_swab_ost_lvb);
			if (unlikely(lvb == NULL)) {
				LDLM_ERROR(lock, "no LVB");
				return -EPROTO;
			}

			memcpy(data, lvb, size);
		} else if (size == sizeof(struct ost_lvb_v1)) {
			struct ost_lvb *olvb = data;

			if (loc == RCL_CLIENT)
				lvb = req_capsule_client_swab_get(pill,
						&RMF_DLM_LVB,
						lustre_swab_ost_lvb_v1);
			else
				lvb = req_capsule_server_sized_swab_get(pill,
						&RMF_DLM_LVB, size,
						lustre_swab_ost_lvb_v1);
			if (unlikely(lvb == NULL)) {
				LDLM_ERROR(lock, "no LVB");
				return -EPROTO;
			}

			memcpy(data, lvb, size);
			olvb->lvb_mtime_ns = 0;
			olvb->lvb_atime_ns = 0;
			olvb->lvb_ctime_ns = 0;
		} else {
			LDLM_ERROR(lock, "Replied unexpected ost LVB size %d",
				   size);
			return -EINVAL;
		}
		break;
	case LVB_T_LQUOTA:
		if (size == sizeof(struct lquota_lvb)) {
			if (loc == RCL_CLIENT)
				lvb = req_capsule_client_swab_get(pill,
						&RMF_DLM_LVB,
						lustre_swab_lquota_lvb);
			else
				lvb = req_capsule_server_swab_get(pill,
						&RMF_DLM_LVB,
						lustre_swab_lquota_lvb);
			if (unlikely(lvb == NULL)) {
				LDLM_ERROR(lock, "no LVB");
				return -EPROTO;
			}

			memcpy(data, lvb, size);
		} else {
			LDLM_ERROR(lock,
				   "Replied unexpected lquota LVB size %d",
				   size);
			return -EINVAL;
		}
		break;
	case LVB_T_LAYOUT:
		if (size == 0)
			break;

		if (loc == RCL_CLIENT)
			lvb = req_capsule_client_get(pill, &RMF_DLM_LVB);
		else
			lvb = req_capsule_server_get(pill, &RMF_DLM_LVB);
		if (unlikely(lvb == NULL)) {
			LDLM_ERROR(lock, "no LVB");
			return -EPROTO;
		}

		memcpy(data, lvb, size);
		break;
	default:
		LDLM_ERROR(lock, "Unknown LVB type: %d\n", lock->l_lvb_type);
		dump_stack();
		return -EINVAL;
	}

	return 0;
}

/**
 * Create and fill in new LDLM lock with specified properties.
 * Returns a referenced lock.
 */
struct ldlm_lock *ldlm_lock_create(struct ldlm_namespace *ns,
				   const struct ldlm_res_id *res_id,
				   ldlm_type_t type,
				   ldlm_mode_t mode,
				   const struct ldlm_callback_suite *cbs,
				   void *data, __u32 lvb_len,
				   enum lvb_type lvb_type)
{
	struct ldlm_lock *lock;
	struct ldlm_resource *res;

	res = ldlm_resource_get(ns, NULL, res_id, type, 1);
	if (res == NULL)
		return NULL;

	lock = ldlm_lock_new(res);

	if (lock == NULL)
		return NULL;

	lock->l_req_mode = mode;
	lock->l_ast_data = data;
	lock->l_pid = current_pid();
	if (cbs) {
		lock->l_blocking_ast = cbs->lcs_blocking;
		lock->l_completion_ast = cbs->lcs_completion;
		lock->l_glimpse_ast = cbs->lcs_glimpse;
	}

	lock->l_tree_node = NULL;
	/* if this is an extent lock, allocate the interval tree node */
	if (type == LDLM_EXTENT) {
		if (ldlm_interval_alloc(lock) == NULL)
			goto out;
	}

	if (lvb_len) {
		lock->l_lvb_len = lvb_len;
		lock->l_lvb_data = kzalloc(lvb_len, GFP_NOFS);
		if (!lock->l_lvb_data)
			goto out;
	}

	lock->l_lvb_type = lvb_type;
	if (OBD_FAIL_CHECK(OBD_FAIL_LDLM_NEW_LOCK))
		goto out;

	return lock;

out:
	ldlm_lock_destroy(lock);
	LDLM_LOCK_RELEASE(lock);
	return NULL;
}
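
/*
 * Usage sketch (editor's illustration, not part of the upstream file):
 * a minimal creation call.  The NULL callback suite, NULL ast_data and
 * zero LVB length are placeholder assumptions; real callers pass their
 * own.  The returned lock carries the references described above
 * ldlm_lock_new().
 */
static inline struct ldlm_lock *
ldlm_lock_create_sketch(struct ldlm_namespace *ns,
			const struct ldlm_res_id *res_id)
{
	return ldlm_lock_create(ns, res_id, LDLM_IBITS, LCK_PR,
				NULL /* cbs */, NULL /* ast_data */,
				0 /* lvb_len */, LVB_T_NONE);
}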

/**
 * Enqueue (request) a lock.
 * On the client this is called from ldlm_cli_enqueue_fini
 * after we already got an initial reply from the server with some status.
 *
 * Does not block. As a result of the enqueue the lock is put on the
 * granted or the waiting list.
 */
ldlm_error_t ldlm_lock_enqueue(struct ldlm_namespace *ns,
			       struct ldlm_lock **lockp,
			       void *cookie, __u64 *flags)
{
	struct ldlm_lock *lock = *lockp;
	struct ldlm_resource *res = lock->l_resource;

	lock->l_last_activity = ktime_get_real_seconds();

	lock_res_and_lock(lock);
	if (lock->l_req_mode == lock->l_granted_mode) {
		/* The server returned a blocked lock, but it was granted
		 * before we got a chance to actually enqueue it.  We don't
		 * need to do anything else. */
		*flags &= ~(LDLM_FL_BLOCK_GRANTED |
			    LDLM_FL_BLOCK_CONV | LDLM_FL_BLOCK_WAIT);
		goto out;
	}

	ldlm_resource_unlink_lock(lock);

	/* Cannot happen unless on the server */
	if (res->lr_type == LDLM_EXTENT && !lock->l_tree_node)
		LBUG();

	/* Some flags from the enqueue want to make it into the AST, via the
	 * lock's l_flags. */
	lock->l_flags |= *flags & LDLM_FL_AST_DISCARD_DATA;

	/*
	 * This distinction between local lock trees is very important; a client
	 * namespace only has information about locks taken by that client, and
	 * thus doesn't have enough information to decide for itself if it can
	 * be granted (below).  In this case, we do exactly what the server
	 * tells us to do, as dictated by the 'flags'.
	 */
	if (*flags & (LDLM_FL_BLOCK_WAIT | LDLM_FL_BLOCK_GRANTED))
		ldlm_resource_add_lock(res, &res->lr_waiting, lock);
	else
		ldlm_grant_lock(lock, NULL);

out:
	unlock_res_and_lock(lock);
	return ELDLM_OK;
}

/**
 * Process a call to blocking AST callback for a lock in ast_work list
 */
static int
ldlm_work_bl_ast_lock(struct ptlrpc_request_set *rqset, void *opaq)
{
	struct ldlm_cb_set_arg *arg = opaq;
	struct ldlm_lock_desc   d;
	int		     rc;
	struct ldlm_lock       *lock;

	if (list_empty(arg->list))
		return -ENOENT;

	lock = list_entry(arg->list->next, struct ldlm_lock, l_bl_ast);

	/* nobody should touch l_bl_ast */
	lock_res_and_lock(lock);
	list_del_init(&lock->l_bl_ast);

	LASSERT(lock->l_flags & LDLM_FL_AST_SENT);
	LASSERT(lock->l_bl_ast_run == 0);
	LASSERT(lock->l_blocking_lock);
	lock->l_bl_ast_run++;
	unlock_res_and_lock(lock);

	ldlm_lock2desc(lock->l_blocking_lock, &d);

	rc = lock->l_blocking_ast(lock, &d, (void *)arg, LDLM_CB_BLOCKING);
	LDLM_LOCK_RELEASE(lock->l_blocking_lock);
	lock->l_blocking_lock = NULL;
	LDLM_LOCK_RELEASE(lock);

	return rc;
}

/**
 * Process a call to completion AST callback for a lock in ast_work list
 */
static int
ldlm_work_cp_ast_lock(struct ptlrpc_request_set *rqset, void *opaq)
{
	struct ldlm_cb_set_arg  *arg = opaq;
	int		      rc = 0;
	struct ldlm_lock	*lock;
	ldlm_completion_callback completion_callback;

	if (list_empty(arg->list))
		return -ENOENT;

	lock = list_entry(arg->list->next, struct ldlm_lock, l_cp_ast);

	/* It's possible to receive a completion AST before we've set
	 * the l_completion_ast pointer: either because the AST arrived
	 * before the reply, or simply because there's a small race
	 * window between receiving the reply and finishing the local
	 * enqueue. (bug 842)
	 *
	 * This can't happen with the blocking_ast, however, because we
	 * will never call the local blocking_ast until we drop our
	 * reader/writer reference, which we won't do until we get the
	 * reply and finish enqueueing. */

	/* nobody should touch l_cp_ast */
	lock_res_and_lock(lock);
	list_del_init(&lock->l_cp_ast);
	LASSERT(lock->l_flags & LDLM_FL_CP_REQD);
	/* save l_completion_ast since it can be changed by
	 * mds_intent_policy(), see bug 14225 */
	completion_callback = lock->l_completion_ast;
	lock->l_flags &= ~LDLM_FL_CP_REQD;
	unlock_res_and_lock(lock);

	if (completion_callback != NULL)
		rc = completion_callback(lock, 0, (void *)arg);
	LDLM_LOCK_RELEASE(lock);

	return rc;
}

/**
 * Process a call to revocation AST callback for a lock in ast_work list
 */
static int
ldlm_work_revoke_ast_lock(struct ptlrpc_request_set *rqset, void *opaq)
{
	struct ldlm_cb_set_arg *arg = opaq;
	struct ldlm_lock_desc   desc;
	int		     rc;
	struct ldlm_lock       *lock;

	if (list_empty(arg->list))
		return -ENOENT;

	lock = list_entry(arg->list->next, struct ldlm_lock, l_rk_ast);
	list_del_init(&lock->l_rk_ast);
	/* the desc just pretends to be exclusive */
1661 	ldlm_lock2desc(lock, &desc);
1662 	desc.l_req_mode = LCK_EX;
1663 	desc.l_granted_mode = 0;
1664 
1665 	rc = lock->l_blocking_ast(lock, &desc, (void *)arg, LDLM_CB_BLOCKING);
1666 	LDLM_LOCK_RELEASE(lock);
1667 
1668 	return rc;
1669 }

/**
 * Process a call to glimpse AST callback for a lock in ast_work list
 */
static int ldlm_work_gl_ast_lock(struct ptlrpc_request_set *rqset, void *opaq)
{
	struct ldlm_cb_set_arg		*arg = opaq;
	struct ldlm_glimpse_work	*gl_work;
	struct ldlm_lock		*lock;
	int				 rc = 0;

	if (list_empty(arg->list))
		return -ENOENT;

	gl_work = list_entry(arg->list->next, struct ldlm_glimpse_work,
			     gl_list);
	list_del_init(&gl_work->gl_list);

	lock = gl_work->gl_lock;

	/* transfer the glimpse descriptor to ldlm_cb_set_arg */
	arg->gl_desc = gl_work->gl_desc;

	/* invoke the actual glimpse callback */
	if (lock->l_glimpse_ast(lock, (void *)arg) == 0)
		rc = 1;

	LDLM_LOCK_RELEASE(lock);

	if ((gl_work->gl_flags & LDLM_GL_WORK_NOFREE) == 0)
		kfree(gl_work);

	return rc;
}
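
/*
 * Illustrative sketch (hypothetical server-side caller, not taken from
 * this file): glimpse work items are queued on a list and handed to
 * ldlm_run_ast_work() with LDLM_WORK_GL_AST.  Note that the worker above
 * drops one lock reference and frees the work item unless
 * LDLM_GL_WORK_NOFREE is set, so a caller must take a reference and
 * allocate accordingly:
 *
 *	struct ldlm_glimpse_work *gl_work;
 *	LIST_HEAD(gl_list);
 *
 *	gl_work = kzalloc(sizeof(*gl_work), GFP_NOFS);
 *	if (gl_work == NULL)
 *		return -ENOMEM;
 *	gl_work->gl_lock = LDLM_LOCK_GET(lock);
 *	gl_work->gl_flags = 0;		(item is freed by the worker above)
 *	list_add_tail(&gl_work->gl_list, &gl_list);
 *	rc = ldlm_run_ast_work(ns, &gl_list, LDLM_WORK_GL_AST);
 */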

/**
 * Process a list of locks in need of ASTs being sent.
 *
 * Used on the server to send multiple ASTs together instead of sending
 * them one by one.
 */
int ldlm_run_ast_work(struct ldlm_namespace *ns, struct list_head *rpc_list,
		      enum ldlm_desc_ast_t ast_type)
{
	struct ldlm_cb_set_arg	*arg;
	set_producer_func	 work_ast_lock;
	int			 rc;

	if (list_empty(rpc_list))
		return 0;

	arg = kzalloc(sizeof(*arg), GFP_NOFS);
	if (!arg)
		return -ENOMEM;

	atomic_set(&arg->restart, 0);
	arg->list = rpc_list;

	switch (ast_type) {
	case LDLM_WORK_BL_AST:
		arg->type = LDLM_BL_CALLBACK;
		work_ast_lock = ldlm_work_bl_ast_lock;
		break;
	case LDLM_WORK_CP_AST:
		arg->type = LDLM_CP_CALLBACK;
		work_ast_lock = ldlm_work_cp_ast_lock;
		break;
	case LDLM_WORK_REVOKE_AST:
		arg->type = LDLM_BL_CALLBACK;
		work_ast_lock = ldlm_work_revoke_ast_lock;
		break;
	case LDLM_WORK_GL_AST:
		arg->type = LDLM_GL_CALLBACK;
		work_ast_lock = ldlm_work_gl_ast_lock;
		break;
	default:
		LBUG();
	}

	/* We create a ptlrpc request set with flow control extension.
	 * This request set will use the work_ast_lock function to produce
	 * new requests and will send a new request each time one completes
	 * in order to keep the number of requests in flight at
	 * ns_max_parallel_ast. */
	arg->set = ptlrpc_prep_fcset(ns->ns_max_parallel_ast ? : UINT_MAX,
				     work_ast_lock, arg);
	if (arg->set == NULL) {
		rc = -ENOMEM;
		goto out;
	}

	ptlrpc_set_wait(arg->set);
	ptlrpc_set_destroy(arg->set);

	rc = atomic_read(&arg->restart) ? -ERESTART : 0;
out:
	kfree(arg);
	return rc;
}
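
/*
 * Hedged usage sketch (hypothetical caller, not from this file): code
 * that has gathered locks in need of blocking ASTs onto a local list
 * can push them out in parallel as shown below; -ERESTART signals that
 * at least one AST could not be delivered and the caller may need to
 * redo its pass:
 *
 *	LIST_HEAD(rpc_list);
 *
 *	...queue locks on &rpc_list via their l_bl_ast links...
 *	rc = ldlm_run_ast_work(ns, &rpc_list, LDLM_WORK_BL_AST);
 *	if (rc == -ERESTART)
 *		...restart the reprocessing pass...
 */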

/**
 * Helper function to call blocking AST for LDLM lock \a lock in a
 * "cancelling" mode.
 *
 * Must be called with the lock's resource locked; the resource lock is
 * dropped and re-taken around the blocking AST call.
 */
void ldlm_cancel_callback(struct ldlm_lock *lock)
{
	check_res_locked(lock->l_resource);
	if (!(lock->l_flags & LDLM_FL_CANCEL)) {
		lock->l_flags |= LDLM_FL_CANCEL;
		if (lock->l_blocking_ast) {
			unlock_res_and_lock(lock);
			lock->l_blocking_ast(lock, NULL, lock->l_ast_data,
					     LDLM_CB_CANCELING);
			lock_res_and_lock(lock);
		} else {
			LDLM_DEBUG(lock, "no blocking ast");
		}
	}
	lock->l_flags |= LDLM_FL_BL_DONE;
}

/**
 * Remove skiplist-enabled LDLM lock \a req from granted list
 */
void ldlm_unlink_lock_skiplist(struct ldlm_lock *req)
{
	if (req->l_resource->lr_type != LDLM_PLAIN &&
	    req->l_resource->lr_type != LDLM_IBITS)
		return;

	list_del_init(&req->l_sl_policy);
	list_del_init(&req->l_sl_mode);
}

/**
 * Attempts to cancel LDLM lock \a lock that has no reader/writer references.
 */
void ldlm_lock_cancel(struct ldlm_lock *lock)
{
	struct ldlm_resource *res;
	struct ldlm_namespace *ns;

	lock_res_and_lock(lock);

	res = lock->l_resource;
	ns  = ldlm_res_to_ns(res);

	/* Please do not, no matter how tempting, remove this LBUG without
	 * talking to me first. -phik */
	if (lock->l_readers || lock->l_writers) {
		LDLM_ERROR(lock, "lock still has references");
		LBUG();
	}

	/* Invoke the cancellation callback (blocking AST in "cancelling"
	 * mode). */
	ldlm_cancel_callback(lock);

	ldlm_resource_unlink_lock(lock);
	ldlm_lock_destroy_nolock(lock);

	if (lock->l_granted_mode == lock->l_req_mode)
		ldlm_pool_del(&ns->ns_pool, lock);

	/* Zero out lock->l_granted_mode to make sure we are not called
	 * again for the same lock, which is possible otherwise. */
	lock->l_granted_mode = LCK_MINMODE;
	unlock_res_and_lock(lock);
}
EXPORT_SYMBOL(ldlm_lock_cancel);
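
/*
 * Hedged usage sketch (hypothetical caller): a lock is typically
 * cancelled through its handle once all reader/writer references have
 * been dropped, e.g.:
 *
 *	struct ldlm_lock *lock = ldlm_handle2lock(lockh);
 *
 *	if (lock != NULL) {
 *		ldlm_lock_cancel(lock);
 *		LDLM_LOCK_PUT(lock);
 *	}
 */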

/**
 * Set opaque data into the lock that only makes sense to upper layer.
 *
 * Returns 0 if the data was set (or already held the same value) and
 * -EINVAL otherwise.
 */
int ldlm_lock_set_data(struct lustre_handle *lockh, void *data)
{
	struct ldlm_lock *lock = ldlm_handle2lock(lockh);
	int rc = -EINVAL;

	if (lock) {
		if (lock->l_ast_data == NULL)
			lock->l_ast_data = data;
		if (lock->l_ast_data == data)
			rc = 0;
		LDLM_LOCK_PUT(lock);
	}
	return rc;
}
EXPORT_SYMBOL(ldlm_lock_set_data);
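
/*
 * Hedged usage sketch (hypothetical upper-layer caller): attach a
 * private object, here an inode, to a lock; a non-zero return means
 * the lock already carries different ast_data:
 *
 *	if (ldlm_lock_set_data(lockh, inode) != 0)
 *		...handle the conflicting earlier setting...
 */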

struct export_cl_data {
	struct obd_export	*ecl_exp;
	int			 ecl_loop;
};

/**
 * Print the description of the lock identified by handle \a lockh into
 * the debug log.
 *
 * Used when printing all locks on a resource for debug purposes.
 */
void ldlm_lock_dump_handle(int level, struct lustre_handle *lockh)
{
	struct ldlm_lock *lock;

	if (!((libcfs_debug | D_ERROR) & level))
		return;

	lock = ldlm_handle2lock(lockh);
	if (lock == NULL)
		return;

	LDLM_DEBUG_LIMIT(level, lock, "###");

	LDLM_LOCK_PUT(lock);
}
EXPORT_SYMBOL(ldlm_lock_dump_handle);
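
/*
 * Hedged usage sketch (hypothetical debugging call, the debug mask is
 * an assumption): dump a single lock at a given debug level, e.g. when
 * walking a resource's granted list:
 *
 *	ldlm_lock_dump_handle(D_DLMTRACE, &lockh);
 */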

/**
 * Print lock information with custom message into debug log.
 * Helper function.
 */
void _ldlm_lock_debug(struct ldlm_lock *lock,
		      struct libcfs_debug_msg_data *msgdata,
		      const char *fmt, ...)
{
	va_list args;
	struct obd_export *exp = lock->l_export;
	struct ldlm_resource *resource = lock->l_resource;
	char *nid = "local";

	va_start(args, fmt);

	if (exp && exp->exp_connection) {
		nid = libcfs_nid2str(exp->exp_connection->c_peer.nid);
	} else if (exp && exp->exp_obd != NULL) {
		struct obd_import *imp = exp->exp_obd->u.cli.cl_import;

		nid = libcfs_nid2str(imp->imp_connection->c_peer.nid);
	}

	if (resource == NULL) {
		libcfs_debug_vmsg2(msgdata, fmt, args,
				   " ns: \?\? lock: %p/%#llx lrc: %d/%d,%d mode: %s/%s res: \?\? rrc=\?\? type: \?\?\? flags: %#llx nid: %s remote: %#llx expref: %d pid: %u timeout: %lu lvb_type: %d\n",
				   lock,
				   lock->l_handle.h_cookie, atomic_read(&lock->l_refc),
				   lock->l_readers, lock->l_writers,
				   ldlm_lockname[lock->l_granted_mode],
				   ldlm_lockname[lock->l_req_mode],
				   lock->l_flags, nid, lock->l_remote_handle.cookie,
				   exp ? atomic_read(&exp->exp_refcount) : -99,
				   lock->l_pid, lock->l_callback_timeout, lock->l_lvb_type);
		va_end(args);
		return;
	}

	switch (resource->lr_type) {
	case LDLM_EXTENT:
		libcfs_debug_vmsg2(msgdata, fmt, args,
				   " ns: %s lock: %p/%#llx lrc: %d/%d,%d mode: %s/%s res: " DLDLMRES " rrc: %d type: %s [%llu->%llu] (req %llu->%llu) flags: %#llx nid: %s remote: %#llx expref: %d pid: %u timeout: %lu lvb_type: %d\n",
				   ldlm_lock_to_ns_name(lock), lock,
				   lock->l_handle.h_cookie, atomic_read(&lock->l_refc),
				   lock->l_readers, lock->l_writers,
				   ldlm_lockname[lock->l_granted_mode],
				   ldlm_lockname[lock->l_req_mode],
				   PLDLMRES(resource),
				   atomic_read(&resource->lr_refcount),
				   ldlm_typename[resource->lr_type],
				   lock->l_policy_data.l_extent.start,
				   lock->l_policy_data.l_extent.end,
				   lock->l_req_extent.start, lock->l_req_extent.end,
				   lock->l_flags, nid, lock->l_remote_handle.cookie,
				   exp ? atomic_read(&exp->exp_refcount) : -99,
				   lock->l_pid, lock->l_callback_timeout,
				   lock->l_lvb_type);
		break;

	case LDLM_FLOCK:
		libcfs_debug_vmsg2(msgdata, fmt, args,
				   " ns: %s lock: %p/%#llx lrc: %d/%d,%d mode: %s/%s res: " DLDLMRES " rrc: %d type: %s pid: %d [%llu->%llu] flags: %#llx nid: %s remote: %#llx expref: %d pid: %u timeout: %lu\n",
				   ldlm_lock_to_ns_name(lock), lock,
				   lock->l_handle.h_cookie, atomic_read(&lock->l_refc),
				   lock->l_readers, lock->l_writers,
				   ldlm_lockname[lock->l_granted_mode],
				   ldlm_lockname[lock->l_req_mode],
				   PLDLMRES(resource),
				   atomic_read(&resource->lr_refcount),
				   ldlm_typename[resource->lr_type],
				   lock->l_policy_data.l_flock.pid,
				   lock->l_policy_data.l_flock.start,
				   lock->l_policy_data.l_flock.end,
				   lock->l_flags, nid, lock->l_remote_handle.cookie,
				   exp ? atomic_read(&exp->exp_refcount) : -99,
				   lock->l_pid, lock->l_callback_timeout);
		break;

	case LDLM_IBITS:
		libcfs_debug_vmsg2(msgdata, fmt, args,
				   " ns: %s lock: %p/%#llx lrc: %d/%d,%d mode: %s/%s res: " DLDLMRES " bits %#llx rrc: %d type: %s flags: %#llx nid: %s remote: %#llx expref: %d pid: %u timeout: %lu lvb_type: %d\n",
				   ldlm_lock_to_ns_name(lock),
				   lock, lock->l_handle.h_cookie,
				   atomic_read(&lock->l_refc),
				   lock->l_readers, lock->l_writers,
				   ldlm_lockname[lock->l_granted_mode],
				   ldlm_lockname[lock->l_req_mode],
				   PLDLMRES(resource),
				   lock->l_policy_data.l_inodebits.bits,
				   atomic_read(&resource->lr_refcount),
				   ldlm_typename[resource->lr_type],
				   lock->l_flags, nid, lock->l_remote_handle.cookie,
				   exp ? atomic_read(&exp->exp_refcount) : -99,
				   lock->l_pid, lock->l_callback_timeout,
				   lock->l_lvb_type);
		break;

	default:
		libcfs_debug_vmsg2(msgdata, fmt, args,
				   " ns: %s lock: %p/%#llx lrc: %d/%d,%d mode: %s/%s res: " DLDLMRES " rrc: %d type: %s flags: %#llx nid: %s remote: %#llx expref: %d pid: %u timeout: %lu lvb_type: %d\n",
				   ldlm_lock_to_ns_name(lock),
				   lock, lock->l_handle.h_cookie,
				   atomic_read(&lock->l_refc),
				   lock->l_readers, lock->l_writers,
				   ldlm_lockname[lock->l_granted_mode],
				   ldlm_lockname[lock->l_req_mode],
				   PLDLMRES(resource),
				   atomic_read(&resource->lr_refcount),
				   ldlm_typename[resource->lr_type],
				   lock->l_flags, nid, lock->l_remote_handle.cookie,
				   exp ? atomic_read(&exp->exp_refcount) : -99,
				   lock->l_pid, lock->l_callback_timeout,
				   lock->l_lvb_type);
		break;
	}
	va_end(args);
}
EXPORT_SYMBOL(_ldlm_lock_debug);
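
/*
 * Hedged usage note: callers normally reach _ldlm_lock_debug() through
 * the LDLM_DEBUG()/LDLM_ERROR() macros rather than directly, as in the
 * LDLM_DEBUG(lock, "no blocking ast") call in ldlm_cancel_callback()
 * above.  The trailing arguments are printf-style, e.g.:
 *
 *	LDLM_DEBUG(lock, "completion callback returned %d", rc);
 */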