File locking changes for v4.21

-----BEGIN PGP SIGNATURE-----
 
 iQIcBAABAgAGBQJcILryAAoJEAAOaEEZVoIVByMP/RYty0dsV9ALt0PKqxKyDVT7
 9KOGA73JIahpeO2dnlIiZAXdeC3Y350UH2axrX6Xy/X6ktTCca3X/xqZMn/wK5kt
 zeMeqcjsyTz4wJoOCWUm7nsteMALfusDAIMd8axEnBFgWk9nsQwgh+jS1gYVj2D1
 GUSdCceKcQ0ZOSsZDzDFgd/R34dNMobvYd1aOE2bgHL19BAXj1aKIv81yAjjY41A
 D+VVvEyzIHQUtxmWk1X3X8kYfhHMu4X5AQhhqPxw8jw8CC0w0lfQTOZe/ApeMfxZ
 BFhusMdwf8QhkGWMOfhOTldTm3GobBmdsNX5HmukvcAEjDVPiOLCiKXaLWEBJ68r
 HbmB3YyxzT2re0PfSa72WIu6W8aKZHUny+BLgTHiuW3KIV1khJK4AflWKMLfe8yi
 0xUWm0SeiwMCdBLtkD8IykC19LBCAKM15JBxpUHadBvBsO9G+54DfzRImjnxSjAH
 tX0RnFWmA7hXt02fZjcywT+/+n84kt0lbjdJAKXK6tl0DbGxlEj8YoJVBNG/p94q
 ARHgBKMFTrsDPJiMY5WSobHapjmnSNDBk6uSf6TPe2E5wmnhLcwfTqwCdnpocW6c
 A7CX+q/Jfyk1oNEGajXXyIsjaDc2Ma0Fs/mfb3o5Lhkjq68e+LT0+eIjn4veuY5H
 KoZ/KVBGs4Uxy81qMPkl
 =sUSp
 -----END PGP SIGNATURE-----

Merge tag 'locks-v4.21-1' of git://git.kernel.org/pub/scm/linux/kernel/git/jlayton/linux

Pull file locking updates from Jeff Layton:
 "The main change in this set is Neil Brown's work to reduce the
  thundering herd problem when a heavily-contended file lock is
  released.

  Previously we'd always wake up all waiters when this occurred. With
  this set, we'll now we only wake up waiters that were blocked on the
  range being released"

* tag 'locks-v4.21-1' of git://git.kernel.org/pub/scm/linux/kernel/git/jlayton/linux:
  locks: Use inode_is_open_for_write
  fs/locks: remove unnecessary white space.
  fs/locks: merge posix_unblock_lock() and locks_delete_block()
  fs/locks: create a tree of dependent requests.
  fs/locks: change all *_conflict() functions to return bool.
  fs/locks: always delete_block after waiting.
  fs/locks: allow a lock request to block other requests.
  fs/locks: use properly initialized file_lock when unlocking.
  ocfs2: properly initial file_lock used for unlock.
  gfs2: properly initial file_lock used for unlock.
  NFS: use locks_copy_lock() to copy locks.
  fs/locks: split out __locks_wake_up_blocks().
  fs/locks: rename some lists and pointers.
This commit is contained in:
Linus Torvalds 2018-12-27 17:12:30 -08:00
commit 00c569b567
9 changed files with 253 additions and 158 deletions

View File

@ -1103,10 +1103,10 @@ try_again:
rc = posix_lock_file(file, flock, NULL); rc = posix_lock_file(file, flock, NULL);
up_write(&cinode->lock_sem); up_write(&cinode->lock_sem);
if (rc == FILE_LOCK_DEFERRED) { if (rc == FILE_LOCK_DEFERRED) {
rc = wait_event_interruptible(flock->fl_wait, !flock->fl_next); rc = wait_event_interruptible(flock->fl_wait, !flock->fl_blocker);
if (!rc) if (!rc)
goto try_again; goto try_again;
posix_unblock_lock(flock); locks_delete_block(flock);
} }
return rc; return rc;
} }

View File

@ -1199,13 +1199,13 @@ static int do_flock(struct file *file, int cmd, struct file_lock *fl)
mutex_lock(&fp->f_fl_mutex); mutex_lock(&fp->f_fl_mutex);
if (gfs2_holder_initialized(fl_gh)) { if (gfs2_holder_initialized(fl_gh)) {
struct file_lock request;
if (fl_gh->gh_state == state) if (fl_gh->gh_state == state)
goto out; goto out;
locks_lock_file_wait(file, locks_init_lock(&request);
&(struct file_lock) { request.fl_type = F_UNLCK;
.fl_type = F_UNLCK, request.fl_flags = FL_FLOCK;
.fl_flags = FL_FLOCK locks_lock_file_wait(file, &request);
});
gfs2_glock_dq(fl_gh); gfs2_glock_dq(fl_gh);
gfs2_holder_reinit(state, flags, fl_gh); gfs2_holder_reinit(state, flags, fl_gh);
} else { } else {

View File

@ -276,7 +276,7 @@ static int nlmsvc_unlink_block(struct nlm_block *block)
dprintk("lockd: unlinking block %p...\n", block); dprintk("lockd: unlinking block %p...\n", block);
/* Remove block from list */ /* Remove block from list */
status = posix_unblock_lock(&block->b_call->a_args.lock.fl); status = locks_delete_block(&block->b_call->a_args.lock.fl);
nlmsvc_remove_block(block); nlmsvc_remove_block(block);
return status; return status;
} }

View File

@ -112,6 +112,46 @@
* Leases and LOCK_MAND * Leases and LOCK_MAND
* Matthew Wilcox <willy@debian.org>, June, 2000. * Matthew Wilcox <willy@debian.org>, June, 2000.
* Stephen Rothwell <sfr@canb.auug.org.au>, June, 2000. * Stephen Rothwell <sfr@canb.auug.org.au>, June, 2000.
*
* Locking conflicts and dependencies:
* If multiple threads attempt to lock the same byte (or flock the same file)
* only one can be granted the lock, and other must wait their turn.
* The first lock has been "applied" or "granted", the others are "waiting"
* and are "blocked" by the "applied" lock..
*
* Waiting and applied locks are all kept in trees whose properties are:
*
* - the root of a tree may be an applied or waiting lock.
* - every other node in the tree is a waiting lock that
* conflicts with every ancestor of that node.
*
* Every such tree begins life as a waiting singleton which obviously
* satisfies the above properties.
*
* The only ways we modify trees preserve these properties:
*
* 1. We may add a new leaf node, but only after first verifying that it
* conflicts with all of its ancestors.
* 2. We may remove the root of a tree, creating a new singleton
* tree from the root and N new trees rooted in the immediate
* children.
* 3. If the root of a tree is not currently an applied lock, we may
* apply it (if possible).
* 4. We may upgrade the root of the tree (either extend its range,
* or upgrade its entire range from read to write).
*
* When an applied lock is modified in a way that reduces or downgrades any
* part of its range, we remove all its children (2 above). This particularly
* happens when a lock is unlocked.
*
* For each of those child trees we "wake up" the thread which is
* waiting for the lock so it can continue handling as follows: if the
* root of the tree applies, we do so (3). If it doesn't, it must
* conflict with some applied lock. We remove (wake up) all of its children
* (2), and add it is a new leaf to the tree rooted in the applied
* lock (1). We then repeat the process recursively with those
* children.
*
*/ */
#include <linux/capability.h> #include <linux/capability.h>
@ -189,9 +229,9 @@ static DEFINE_HASHTABLE(blocked_hash, BLOCKED_HASH_BITS);
* This lock protects the blocked_hash. Generally, if you're accessing it, you * This lock protects the blocked_hash. Generally, if you're accessing it, you
* want to be holding this lock. * want to be holding this lock.
* *
* In addition, it also protects the fl->fl_block list, and the fl->fl_next * In addition, it also protects the fl->fl_blocked_requests list, and the
* pointer for file_lock structures that are acting as lock requests (in * fl->fl_blocker pointer for file_lock structures that are acting as lock
* contrast to those that are acting as records of acquired locks). * requests (in contrast to those that are acting as records of acquired locks).
* *
* Note that when we acquire this lock in order to change the above fields, * Note that when we acquire this lock in order to change the above fields,
* we often hold the flc_lock as well. In certain cases, when reading the fields * we often hold the flc_lock as well. In certain cases, when reading the fields
@ -293,7 +333,8 @@ static void locks_init_lock_heads(struct file_lock *fl)
{ {
INIT_HLIST_NODE(&fl->fl_link); INIT_HLIST_NODE(&fl->fl_link);
INIT_LIST_HEAD(&fl->fl_list); INIT_LIST_HEAD(&fl->fl_list);
INIT_LIST_HEAD(&fl->fl_block); INIT_LIST_HEAD(&fl->fl_blocked_requests);
INIT_LIST_HEAD(&fl->fl_blocked_member);
init_waitqueue_head(&fl->fl_wait); init_waitqueue_head(&fl->fl_wait);
} }
@ -332,7 +373,8 @@ void locks_free_lock(struct file_lock *fl)
{ {
BUG_ON(waitqueue_active(&fl->fl_wait)); BUG_ON(waitqueue_active(&fl->fl_wait));
BUG_ON(!list_empty(&fl->fl_list)); BUG_ON(!list_empty(&fl->fl_list));
BUG_ON(!list_empty(&fl->fl_block)); BUG_ON(!list_empty(&fl->fl_blocked_requests));
BUG_ON(!list_empty(&fl->fl_blocked_member));
BUG_ON(!hlist_unhashed(&fl->fl_link)); BUG_ON(!hlist_unhashed(&fl->fl_link));
locks_release_private(fl); locks_release_private(fl);
@ -357,7 +399,6 @@ void locks_init_lock(struct file_lock *fl)
memset(fl, 0, sizeof(struct file_lock)); memset(fl, 0, sizeof(struct file_lock));
locks_init_lock_heads(fl); locks_init_lock_heads(fl);
} }
EXPORT_SYMBOL(locks_init_lock); EXPORT_SYMBOL(locks_init_lock);
/* /*
@ -397,9 +438,26 @@ void locks_copy_lock(struct file_lock *new, struct file_lock *fl)
fl->fl_ops->fl_copy_lock(new, fl); fl->fl_ops->fl_copy_lock(new, fl);
} }
} }
EXPORT_SYMBOL(locks_copy_lock); EXPORT_SYMBOL(locks_copy_lock);
static void locks_move_blocks(struct file_lock *new, struct file_lock *fl)
{
struct file_lock *f;
/*
* As ctx->flc_lock is held, new requests cannot be added to
* ->fl_blocked_requests, so we don't need a lock to check if it
* is empty.
*/
if (list_empty(&fl->fl_blocked_requests))
return;
spin_lock(&blocked_lock_lock);
list_splice_init(&fl->fl_blocked_requests, &new->fl_blocked_requests);
list_for_each_entry(f, &fl->fl_blocked_requests, fl_blocked_member)
f->fl_blocker = new;
spin_unlock(&blocked_lock_lock);
}
static inline int flock_translate_cmd(int cmd) { static inline int flock_translate_cmd(int cmd) {
if (cmd & LOCK_MAND) if (cmd & LOCK_MAND)
return cmd & (LOCK_MAND | LOCK_RW); return cmd & (LOCK_MAND | LOCK_RW);
@ -416,17 +474,20 @@ static inline int flock_translate_cmd(int cmd) {
/* Fill in a file_lock structure with an appropriate FLOCK lock. */ /* Fill in a file_lock structure with an appropriate FLOCK lock. */
static struct file_lock * static struct file_lock *
flock_make_lock(struct file *filp, unsigned int cmd) flock_make_lock(struct file *filp, unsigned int cmd, struct file_lock *fl)
{ {
struct file_lock *fl;
int type = flock_translate_cmd(cmd); int type = flock_translate_cmd(cmd);
if (type < 0) if (type < 0)
return ERR_PTR(type); return ERR_PTR(type);
if (fl == NULL) {
fl = locks_alloc_lock(); fl = locks_alloc_lock();
if (fl == NULL) if (fl == NULL)
return ERR_PTR(-ENOMEM); return ERR_PTR(-ENOMEM);
} else {
locks_init_lock(fl);
}
fl->fl_file = filp; fl->fl_file = filp;
fl->fl_owner = filp; fl->fl_owner = filp;
@ -666,16 +727,58 @@ static void locks_delete_global_blocked(struct file_lock *waiter)
static void __locks_delete_block(struct file_lock *waiter) static void __locks_delete_block(struct file_lock *waiter)
{ {
locks_delete_global_blocked(waiter); locks_delete_global_blocked(waiter);
list_del_init(&waiter->fl_block); list_del_init(&waiter->fl_blocked_member);
waiter->fl_next = NULL; waiter->fl_blocker = NULL;
} }
static void locks_delete_block(struct file_lock *waiter) static void __locks_wake_up_blocks(struct file_lock *blocker)
{ {
while (!list_empty(&blocker->fl_blocked_requests)) {
struct file_lock *waiter;
waiter = list_first_entry(&blocker->fl_blocked_requests,
struct file_lock, fl_blocked_member);
__locks_delete_block(waiter);
if (waiter->fl_lmops && waiter->fl_lmops->lm_notify)
waiter->fl_lmops->lm_notify(waiter);
else
wake_up(&waiter->fl_wait);
}
}
/**
* locks_delete_lock - stop waiting for a file lock
* @waiter: the lock which was waiting
*
* lockd/nfsd need to disconnect the lock while working on it.
*/
int locks_delete_block(struct file_lock *waiter)
{
int status = -ENOENT;
/*
* If fl_blocker is NULL, it won't be set again as this thread
* "owns" the lock and is the only one that might try to claim
* the lock. So it is safe to test fl_blocker locklessly.
* Also if fl_blocker is NULL, this waiter is not listed on
* fl_blocked_requests for some lock, so no other request can
* be added to the list of fl_blocked_requests for this
* request. So if fl_blocker is NULL, it is safe to
* locklessly check if fl_blocked_requests is empty. If both
* of these checks succeed, there is no need to take the lock.
*/
if (waiter->fl_blocker == NULL &&
list_empty(&waiter->fl_blocked_requests))
return status;
spin_lock(&blocked_lock_lock); spin_lock(&blocked_lock_lock);
if (waiter->fl_blocker)
status = 0;
__locks_wake_up_blocks(waiter);
__locks_delete_block(waiter); __locks_delete_block(waiter);
spin_unlock(&blocked_lock_lock); spin_unlock(&blocked_lock_lock);
return status;
} }
EXPORT_SYMBOL(locks_delete_block);
/* Insert waiter into blocker's block list. /* Insert waiter into blocker's block list.
* We use a circular list so that processes can be easily woken up in * We use a circular list so that processes can be easily woken up in
@ -683,26 +786,49 @@ static void locks_delete_block(struct file_lock *waiter)
* it seems like the reasonable thing to do. * it seems like the reasonable thing to do.
* *
* Must be called with both the flc_lock and blocked_lock_lock held. The * Must be called with both the flc_lock and blocked_lock_lock held. The
* fl_block list itself is protected by the blocked_lock_lock, but by ensuring * fl_blocked_requests list itself is protected by the blocked_lock_lock,
* that the flc_lock is also held on insertions we can avoid taking the * but by ensuring that the flc_lock is also held on insertions we can avoid
* blocked_lock_lock in some cases when we see that the fl_block list is empty. * taking the blocked_lock_lock in some cases when we see that the
* fl_blocked_requests list is empty.
*
* Rather than just adding to the list, we check for conflicts with any existing
* waiters, and add beneath any waiter that blocks the new waiter.
* Thus wakeups don't happen until needed.
*/ */
static void __locks_insert_block(struct file_lock *blocker, static void __locks_insert_block(struct file_lock *blocker,
struct file_lock *waiter) struct file_lock *waiter,
bool conflict(struct file_lock *,
struct file_lock *))
{ {
BUG_ON(!list_empty(&waiter->fl_block)); struct file_lock *fl;
waiter->fl_next = blocker; BUG_ON(!list_empty(&waiter->fl_blocked_member));
list_add_tail(&waiter->fl_block, &blocker->fl_block);
new_blocker:
list_for_each_entry(fl, &blocker->fl_blocked_requests, fl_blocked_member)
if (conflict(fl, waiter)) {
blocker = fl;
goto new_blocker;
}
waiter->fl_blocker = blocker;
list_add_tail(&waiter->fl_blocked_member, &blocker->fl_blocked_requests);
if (IS_POSIX(blocker) && !IS_OFDLCK(blocker)) if (IS_POSIX(blocker) && !IS_OFDLCK(blocker))
locks_insert_global_blocked(waiter); locks_insert_global_blocked(waiter);
/* The requests in waiter->fl_blocked are known to conflict with
* waiter, but might not conflict with blocker, or the requests
* and lock which block it. So they all need to be woken.
*/
__locks_wake_up_blocks(waiter);
} }
/* Must be called with flc_lock held. */ /* Must be called with flc_lock held. */
static void locks_insert_block(struct file_lock *blocker, static void locks_insert_block(struct file_lock *blocker,
struct file_lock *waiter) struct file_lock *waiter,
bool conflict(struct file_lock *,
struct file_lock *))
{ {
spin_lock(&blocked_lock_lock); spin_lock(&blocked_lock_lock);
__locks_insert_block(blocker, waiter); __locks_insert_block(blocker, waiter, conflict);
spin_unlock(&blocked_lock_lock); spin_unlock(&blocked_lock_lock);
} }
@ -716,25 +842,15 @@ static void locks_wake_up_blocks(struct file_lock *blocker)
/* /*
* Avoid taking global lock if list is empty. This is safe since new * Avoid taking global lock if list is empty. This is safe since new
* blocked requests are only added to the list under the flc_lock, and * blocked requests are only added to the list under the flc_lock, and
* the flc_lock is always held here. Note that removal from the fl_block * the flc_lock is always held here. Note that removal from the
* list does not require the flc_lock, so we must recheck list_empty() * fl_blocked_requests list does not require the flc_lock, so we must
* after acquiring the blocked_lock_lock. * recheck list_empty() after acquiring the blocked_lock_lock.
*/ */
if (list_empty(&blocker->fl_block)) if (list_empty(&blocker->fl_blocked_requests))
return; return;
spin_lock(&blocked_lock_lock); spin_lock(&blocked_lock_lock);
while (!list_empty(&blocker->fl_block)) { __locks_wake_up_blocks(blocker);
struct file_lock *waiter;
waiter = list_first_entry(&blocker->fl_block,
struct file_lock, fl_block);
__locks_delete_block(waiter);
if (waiter->fl_lmops && waiter->fl_lmops->lm_notify)
waiter->fl_lmops->lm_notify(waiter);
else
wake_up(&waiter->fl_wait);
}
spin_unlock(&blocked_lock_lock); spin_unlock(&blocked_lock_lock);
} }
@ -766,47 +882,50 @@ locks_delete_lock_ctx(struct file_lock *fl, struct list_head *dispose)
/* Determine if lock sys_fl blocks lock caller_fl. Common functionality /* Determine if lock sys_fl blocks lock caller_fl. Common functionality
* checks for shared/exclusive status of overlapping locks. * checks for shared/exclusive status of overlapping locks.
*/ */
static int locks_conflict(struct file_lock *caller_fl, struct file_lock *sys_fl) static bool locks_conflict(struct file_lock *caller_fl,
struct file_lock *sys_fl)
{ {
if (sys_fl->fl_type == F_WRLCK) if (sys_fl->fl_type == F_WRLCK)
return 1; return true;
if (caller_fl->fl_type == F_WRLCK) if (caller_fl->fl_type == F_WRLCK)
return 1; return true;
return 0; return false;
} }
/* Determine if lock sys_fl blocks lock caller_fl. POSIX specific /* Determine if lock sys_fl blocks lock caller_fl. POSIX specific
* checking before calling the locks_conflict(). * checking before calling the locks_conflict().
*/ */
static int posix_locks_conflict(struct file_lock *caller_fl, struct file_lock *sys_fl) static bool posix_locks_conflict(struct file_lock *caller_fl,
struct file_lock *sys_fl)
{ {
/* POSIX locks owned by the same process do not conflict with /* POSIX locks owned by the same process do not conflict with
* each other. * each other.
*/ */
if (posix_same_owner(caller_fl, sys_fl)) if (posix_same_owner(caller_fl, sys_fl))
return (0); return false;
/* Check whether they overlap */ /* Check whether they overlap */
if (!locks_overlap(caller_fl, sys_fl)) if (!locks_overlap(caller_fl, sys_fl))
return 0; return false;
return (locks_conflict(caller_fl, sys_fl)); return locks_conflict(caller_fl, sys_fl);
} }
/* Determine if lock sys_fl blocks lock caller_fl. FLOCK specific /* Determine if lock sys_fl blocks lock caller_fl. FLOCK specific
* checking before calling the locks_conflict(). * checking before calling the locks_conflict().
*/ */
static int flock_locks_conflict(struct file_lock *caller_fl, struct file_lock *sys_fl) static bool flock_locks_conflict(struct file_lock *caller_fl,
struct file_lock *sys_fl)
{ {
/* FLOCK locks referring to the same filp do not conflict with /* FLOCK locks referring to the same filp do not conflict with
* each other. * each other.
*/ */
if (caller_fl->fl_file == sys_fl->fl_file) if (caller_fl->fl_file == sys_fl->fl_file)
return (0); return false;
if ((caller_fl->fl_type & LOCK_MAND) || (sys_fl->fl_type & LOCK_MAND)) if ((caller_fl->fl_type & LOCK_MAND) || (sys_fl->fl_type & LOCK_MAND))
return 0; return false;
return (locks_conflict(caller_fl, sys_fl)); return locks_conflict(caller_fl, sys_fl);
} }
void void
@ -877,8 +996,11 @@ static struct file_lock *what_owner_is_waiting_for(struct file_lock *block_fl)
struct file_lock *fl; struct file_lock *fl;
hash_for_each_possible(blocked_hash, fl, fl_link, posix_owner_key(block_fl)) { hash_for_each_possible(blocked_hash, fl, fl_link, posix_owner_key(block_fl)) {
if (posix_same_owner(fl, block_fl)) if (posix_same_owner(fl, block_fl)) {
return fl->fl_next; while (fl->fl_blocker)
fl = fl->fl_blocker;
return fl;
}
} }
return NULL; return NULL;
} }
@ -965,12 +1087,13 @@ find_conflict:
if (!(request->fl_flags & FL_SLEEP)) if (!(request->fl_flags & FL_SLEEP))
goto out; goto out;
error = FILE_LOCK_DEFERRED; error = FILE_LOCK_DEFERRED;
locks_insert_block(fl, request); locks_insert_block(fl, request, flock_locks_conflict);
goto out; goto out;
} }
if (request->fl_flags & FL_ACCESS) if (request->fl_flags & FL_ACCESS)
goto out; goto out;
locks_copy_lock(new_fl, request); locks_copy_lock(new_fl, request);
locks_move_blocks(new_fl, request);
locks_insert_lock_ctx(new_fl, &ctx->flc_flock); locks_insert_lock_ctx(new_fl, &ctx->flc_flock);
new_fl = NULL; new_fl = NULL;
error = 0; error = 0;
@ -1039,7 +1162,8 @@ static int posix_lock_inode(struct inode *inode, struct file_lock *request,
spin_lock(&blocked_lock_lock); spin_lock(&blocked_lock_lock);
if (likely(!posix_locks_deadlock(request, fl))) { if (likely(!posix_locks_deadlock(request, fl))) {
error = FILE_LOCK_DEFERRED; error = FILE_LOCK_DEFERRED;
__locks_insert_block(fl, request); __locks_insert_block(fl, request,
posix_locks_conflict);
} }
spin_unlock(&blocked_lock_lock); spin_unlock(&blocked_lock_lock);
goto out; goto out;
@ -1164,6 +1288,7 @@ static int posix_lock_inode(struct inode *inode, struct file_lock *request,
goto out; goto out;
} }
locks_copy_lock(new_fl, request); locks_copy_lock(new_fl, request);
locks_move_blocks(new_fl, request);
locks_insert_lock_ctx(new_fl, &fl->fl_list); locks_insert_lock_ctx(new_fl, &fl->fl_list);
fl = new_fl; fl = new_fl;
new_fl = NULL; new_fl = NULL;
@ -1237,13 +1362,11 @@ static int posix_lock_inode_wait(struct inode *inode, struct file_lock *fl)
error = posix_lock_inode(inode, fl, NULL); error = posix_lock_inode(inode, fl, NULL);
if (error != FILE_LOCK_DEFERRED) if (error != FILE_LOCK_DEFERRED)
break; break;
error = wait_event_interruptible(fl->fl_wait, !fl->fl_next); error = wait_event_interruptible(fl->fl_wait, !fl->fl_blocker);
if (!error) if (error)
continue;
locks_delete_block(fl);
break; break;
} }
locks_delete_block(fl);
return error; return error;
} }
@ -1324,7 +1447,7 @@ int locks_mandatory_area(struct inode *inode, struct file *filp, loff_t start,
error = posix_lock_inode(inode, &fl, NULL); error = posix_lock_inode(inode, &fl, NULL);
if (error != FILE_LOCK_DEFERRED) if (error != FILE_LOCK_DEFERRED)
break; break;
error = wait_event_interruptible(fl.fl_wait, !fl.fl_next); error = wait_event_interruptible(fl.fl_wait, !fl.fl_blocker);
if (!error) { if (!error) {
/* /*
* If we've been sleeping someone might have * If we've been sleeping someone might have
@ -1334,13 +1457,12 @@ int locks_mandatory_area(struct inode *inode, struct file *filp, loff_t start,
continue; continue;
} }
locks_delete_block(&fl);
break; break;
} }
locks_delete_block(&fl);
return error; return error;
} }
EXPORT_SYMBOL(locks_mandatory_area); EXPORT_SYMBOL(locks_mandatory_area);
#endif /* CONFIG_MANDATORY_FILE_LOCKING */ #endif /* CONFIG_MANDATORY_FILE_LOCKING */
@ -1511,14 +1633,14 @@ restart:
break_time -= jiffies; break_time -= jiffies;
if (break_time == 0) if (break_time == 0)
break_time++; break_time++;
locks_insert_block(fl, new_fl); locks_insert_block(fl, new_fl, leases_conflict);
trace_break_lease_block(inode, new_fl); trace_break_lease_block(inode, new_fl);
spin_unlock(&ctx->flc_lock); spin_unlock(&ctx->flc_lock);
percpu_up_read_preempt_enable(&file_rwsem); percpu_up_read_preempt_enable(&file_rwsem);
locks_dispose_list(&dispose); locks_dispose_list(&dispose);
error = wait_event_interruptible_timeout(new_fl->fl_wait, error = wait_event_interruptible_timeout(new_fl->fl_wait,
!new_fl->fl_next, break_time); !new_fl->fl_blocker, break_time);
percpu_down_read_preempt_disable(&file_rwsem); percpu_down_read_preempt_disable(&file_rwsem);
spin_lock(&ctx->flc_lock); spin_lock(&ctx->flc_lock);
@ -1542,7 +1664,6 @@ out:
locks_free_lock(new_fl); locks_free_lock(new_fl);
return error; return error;
} }
EXPORT_SYMBOL(__break_lease); EXPORT_SYMBOL(__break_lease);
/** /**
@ -1573,7 +1694,6 @@ void lease_get_mtime(struct inode *inode, struct timespec64 *time)
if (has_lease) if (has_lease)
*time = current_time(inode); *time = current_time(inode);
} }
EXPORT_SYMBOL(lease_get_mtime); EXPORT_SYMBOL(lease_get_mtime);
/** /**
@ -1646,7 +1766,7 @@ check_conflicting_open(const struct dentry *dentry, const long arg, int flags)
if (flags & FL_LAYOUT) if (flags & FL_LAYOUT)
return 0; return 0;
if ((arg == F_RDLCK) && (atomic_read(&inode->i_writecount) > 0)) if ((arg == F_RDLCK) && inode_is_open_for_write(inode))
return -EAGAIN; return -EAGAIN;
if ((arg == F_WRLCK) && ((d_count(dentry) > 1) || if ((arg == F_WRLCK) && ((d_count(dentry) > 1) ||
@ -1931,13 +2051,11 @@ static int flock_lock_inode_wait(struct inode *inode, struct file_lock *fl)
error = flock_lock_inode(inode, fl); error = flock_lock_inode(inode, fl);
if (error != FILE_LOCK_DEFERRED) if (error != FILE_LOCK_DEFERRED)
break; break;
error = wait_event_interruptible(fl->fl_wait, !fl->fl_next); error = wait_event_interruptible(fl->fl_wait, !fl->fl_blocker);
if (!error) if (error)
continue;
locks_delete_block(fl);
break; break;
} }
locks_delete_block(fl);
return error; return error;
} }
@ -2001,7 +2119,7 @@ SYSCALL_DEFINE2(flock, unsigned int, fd, unsigned int, cmd)
!(f.file->f_mode & (FMODE_READ|FMODE_WRITE))) !(f.file->f_mode & (FMODE_READ|FMODE_WRITE)))
goto out_putf; goto out_putf;
lock = flock_make_lock(f.file, cmd); lock = flock_make_lock(f.file, cmd, NULL);
if (IS_ERR(lock)) { if (IS_ERR(lock)) {
error = PTR_ERR(lock); error = PTR_ERR(lock);
goto out_putf; goto out_putf;
@ -2210,13 +2328,11 @@ static int do_lock_file_wait(struct file *filp, unsigned int cmd,
error = vfs_lock_file(filp, cmd, fl, NULL); error = vfs_lock_file(filp, cmd, fl, NULL);
if (error != FILE_LOCK_DEFERRED) if (error != FILE_LOCK_DEFERRED)
break; break;
error = wait_event_interruptible(fl->fl_wait, !fl->fl_next); error = wait_event_interruptible(fl->fl_wait, !fl->fl_blocker);
if (!error) if (error)
continue;
locks_delete_block(fl);
break; break;
} }
locks_delete_block(fl);
return error; return error;
} }
@ -2476,6 +2592,7 @@ void locks_remove_posix(struct file *filp, fl_owner_t owner)
if (!ctx || list_empty(&ctx->flc_posix)) if (!ctx || list_empty(&ctx->flc_posix))
return; return;
locks_init_lock(&lock);
lock.fl_type = F_UNLCK; lock.fl_type = F_UNLCK;
lock.fl_flags = FL_POSIX | FL_CLOSE; lock.fl_flags = FL_POSIX | FL_CLOSE;
lock.fl_start = 0; lock.fl_start = 0;
@ -2492,26 +2609,21 @@ void locks_remove_posix(struct file *filp, fl_owner_t owner)
lock.fl_ops->fl_release_private(&lock); lock.fl_ops->fl_release_private(&lock);
trace_locks_remove_posix(inode, &lock, error); trace_locks_remove_posix(inode, &lock, error);
} }
EXPORT_SYMBOL(locks_remove_posix); EXPORT_SYMBOL(locks_remove_posix);
/* The i_flctx must be valid when calling into here */ /* The i_flctx must be valid when calling into here */
static void static void
locks_remove_flock(struct file *filp, struct file_lock_context *flctx) locks_remove_flock(struct file *filp, struct file_lock_context *flctx)
{ {
struct file_lock fl = { struct file_lock fl;
.fl_owner = filp,
.fl_pid = current->tgid,
.fl_file = filp,
.fl_flags = FL_FLOCK | FL_CLOSE,
.fl_type = F_UNLCK,
.fl_end = OFFSET_MAX,
};
struct inode *inode = locks_inode(filp); struct inode *inode = locks_inode(filp);
if (list_empty(&flctx->flc_flock)) if (list_empty(&flctx->flc_flock))
return; return;
flock_make_lock(filp, LOCK_UN, &fl);
fl.fl_flags |= FL_CLOSE;
if (filp->f_op->flock) if (filp->f_op->flock)
filp->f_op->flock(filp, F_SETLKW, &fl); filp->f_op->flock(filp, F_SETLKW, &fl);
else else
@ -2569,27 +2681,6 @@ void locks_remove_file(struct file *filp)
spin_unlock(&ctx->flc_lock); spin_unlock(&ctx->flc_lock);
} }
/**
* posix_unblock_lock - stop waiting for a file lock
* @waiter: the lock which was waiting
*
* lockd needs to block waiting for locks.
*/
int
posix_unblock_lock(struct file_lock *waiter)
{
int status = 0;
spin_lock(&blocked_lock_lock);
if (waiter->fl_next)
__locks_delete_block(waiter);
else
status = -ENOENT;
spin_unlock(&blocked_lock_lock);
return status;
}
EXPORT_SYMBOL(posix_unblock_lock);
/** /**
* vfs_cancel_lock - file byte range unblock lock * vfs_cancel_lock - file byte range unblock lock
* @filp: The file to apply the unblock to * @filp: The file to apply the unblock to
@ -2603,7 +2694,6 @@ int vfs_cancel_lock(struct file *filp, struct file_lock *fl)
return filp->f_op->lock(filp, F_CANCELLK, fl); return filp->f_op->lock(filp, F_CANCELLK, fl);
return 0; return 0;
} }
EXPORT_SYMBOL_GPL(vfs_cancel_lock); EXPORT_SYMBOL_GPL(vfs_cancel_lock);
#ifdef CONFIG_PROC_FS #ifdef CONFIG_PROC_FS
@ -2707,7 +2797,7 @@ static int locks_show(struct seq_file *f, void *v)
lock_get_status(f, fl, iter->li_pos, ""); lock_get_status(f, fl, iter->li_pos, "");
list_for_each_entry(bfl, &fl->fl_block, fl_block) list_for_each_entry(bfl, &fl->fl_blocked_requests, fl_blocked_member)
lock_get_status(f, bfl, iter->li_pos, " ->"); lock_get_status(f, bfl, iter->li_pos, " ->");
return 0; return 0;
@ -2803,7 +2893,6 @@ static int __init filelock_init(void)
filelock_cache = kmem_cache_create("file_lock_cache", filelock_cache = kmem_cache_create("file_lock_cache",
sizeof(struct file_lock), 0, SLAB_PANIC, NULL); sizeof(struct file_lock), 0, SLAB_PANIC, NULL);
for_each_possible_cpu(i) { for_each_possible_cpu(i) {
struct file_lock_list_struct *fll = per_cpu_ptr(&file_lock_list, i); struct file_lock_list_struct *fll = per_cpu_ptr(&file_lock_list, i);
@ -2813,5 +2902,4 @@ static int __init filelock_init(void)
return 0; return 0;
} }
core_initcall(filelock_init); core_initcall(filelock_init);

View File

@ -6311,7 +6311,8 @@ static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
/* Ensure we don't close file until we're done freeing locks! */ /* Ensure we don't close file until we're done freeing locks! */
p->ctx = get_nfs_open_context(ctx); p->ctx = get_nfs_open_context(ctx);
p->l_ctx = nfs_get_lock_context(ctx); p->l_ctx = nfs_get_lock_context(ctx);
memcpy(&p->fl, fl, sizeof(p->fl)); locks_init_lock(&p->fl);
locks_copy_lock(&p->fl, fl);
p->server = NFS_SERVER(inode); p->server = NFS_SERVER(inode);
return p; return p;
} }
@ -6533,7 +6534,8 @@ static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
p->server = server; p->server = server;
refcount_inc(&lsp->ls_count); refcount_inc(&lsp->ls_count);
p->ctx = get_nfs_open_context(ctx); p->ctx = get_nfs_open_context(ctx);
memcpy(&p->fl, fl, sizeof(p->fl)); locks_init_lock(&p->fl);
locks_copy_lock(&p->fl, fl);
return p; return p;
out_free_seqid: out_free_seqid:
nfs_free_seqid(p->arg.open_seqid); nfs_free_seqid(p->arg.open_seqid);

View File

@ -238,7 +238,7 @@ find_blocked_lock(struct nfs4_lockowner *lo, struct knfsd_fh *fh,
} }
spin_unlock(&nn->blocked_locks_lock); spin_unlock(&nn->blocked_locks_lock);
if (found) if (found)
posix_unblock_lock(&found->nbl_lock); locks_delete_block(&found->nbl_lock);
return found; return found;
} }
@ -293,7 +293,7 @@ remove_blocked_locks(struct nfs4_lockowner *lo)
nbl = list_first_entry(&reaplist, struct nfsd4_blocked_lock, nbl = list_first_entry(&reaplist, struct nfsd4_blocked_lock,
nbl_lru); nbl_lru);
list_del_init(&nbl->nbl_lru); list_del_init(&nbl->nbl_lru);
posix_unblock_lock(&nbl->nbl_lock); locks_delete_block(&nbl->nbl_lock);
free_blocked_lock(nbl); free_blocked_lock(nbl);
} }
} }
@ -4863,7 +4863,7 @@ nfs4_laundromat(struct nfsd_net *nn)
nbl = list_first_entry(&reaplist, nbl = list_first_entry(&reaplist,
struct nfsd4_blocked_lock, nbl_lru); struct nfsd4_blocked_lock, nbl_lru);
list_del_init(&nbl->nbl_lru); list_del_init(&nbl->nbl_lru);
posix_unblock_lock(&nbl->nbl_lock); locks_delete_block(&nbl->nbl_lock);
free_blocked_lock(nbl); free_blocked_lock(nbl);
} }
out: out:

View File

@ -52,6 +52,7 @@ static int ocfs2_do_flock(struct file *file, struct inode *inode,
if (lockres->l_flags & OCFS2_LOCK_ATTACHED && if (lockres->l_flags & OCFS2_LOCK_ATTACHED &&
lockres->l_level > LKM_NLMODE) { lockres->l_level > LKM_NLMODE) {
int old_level = 0; int old_level = 0;
struct file_lock request;
if (lockres->l_level == LKM_EXMODE) if (lockres->l_level == LKM_EXMODE)
old_level = 1; old_level = 1;
@ -66,11 +67,10 @@ static int ocfs2_do_flock(struct file *file, struct inode *inode,
* level. * level.
*/ */
locks_lock_file_wait(file, locks_init_lock(&request);
&(struct file_lock) { request.fl_type = F_UNLCK;
.fl_type = F_UNLCK, request.fl_flags = FL_FLOCK;
.fl_flags = FL_FLOCK locks_lock_file_wait(file, &request);
});
ocfs2_file_unlock(file); ocfs2_file_unlock(file);
} }

View File

@ -1044,10 +1044,15 @@ bool opens_in_grace(struct net *);
* Obviously, the last two criteria only matter for POSIX locks. * Obviously, the last two criteria only matter for POSIX locks.
*/ */
struct file_lock { struct file_lock {
struct file_lock *fl_next; /* singly linked list for this inode */ struct file_lock *fl_blocker; /* The lock, that is blocking us */
struct list_head fl_list; /* link into file_lock_context */ struct list_head fl_list; /* link into file_lock_context */
struct hlist_node fl_link; /* node in global lists */ struct hlist_node fl_link; /* node in global lists */
struct list_head fl_block; /* circular list of blocked processes */ struct list_head fl_blocked_requests; /* list of requests with
* ->fl_blocker pointing here
*/
struct list_head fl_blocked_member; /* node in
* ->fl_blocker->fl_blocked_requests
*/
fl_owner_t fl_owner; fl_owner_t fl_owner;
unsigned int fl_flags; unsigned int fl_flags;
unsigned char fl_type; unsigned char fl_type;
@ -1119,7 +1124,7 @@ extern void locks_remove_file(struct file *);
extern void locks_release_private(struct file_lock *); extern void locks_release_private(struct file_lock *);
extern void posix_test_lock(struct file *, struct file_lock *); extern void posix_test_lock(struct file *, struct file_lock *);
extern int posix_lock_file(struct file *, struct file_lock *, struct file_lock *); extern int posix_lock_file(struct file *, struct file_lock *, struct file_lock *);
extern int posix_unblock_lock(struct file_lock *); extern int locks_delete_block(struct file_lock *);
extern int vfs_test_lock(struct file *, struct file_lock *); extern int vfs_test_lock(struct file *, struct file_lock *);
extern int vfs_lock_file(struct file *, unsigned int, struct file_lock *, struct file_lock *); extern int vfs_lock_file(struct file *, unsigned int, struct file_lock *, struct file_lock *);
extern int vfs_cancel_lock(struct file *filp, struct file_lock *fl); extern int vfs_cancel_lock(struct file *filp, struct file_lock *fl);
@ -1209,7 +1214,7 @@ static inline int posix_lock_file(struct file *filp, struct file_lock *fl,
return -ENOLCK; return -ENOLCK;
} }
static inline int posix_unblock_lock(struct file_lock *waiter) static inline int locks_delete_block(struct file_lock *waiter)
{ {
return -ENOENT; return -ENOENT;
} }

View File

@ -68,7 +68,7 @@ DECLARE_EVENT_CLASS(filelock_lock,
__field(struct file_lock *, fl) __field(struct file_lock *, fl)
__field(unsigned long, i_ino) __field(unsigned long, i_ino)
__field(dev_t, s_dev) __field(dev_t, s_dev)
__field(struct file_lock *, fl_next) __field(struct file_lock *, fl_blocker)
__field(fl_owner_t, fl_owner) __field(fl_owner_t, fl_owner)
__field(unsigned int, fl_pid) __field(unsigned int, fl_pid)
__field(unsigned int, fl_flags) __field(unsigned int, fl_flags)
@ -82,7 +82,7 @@ DECLARE_EVENT_CLASS(filelock_lock,
__entry->fl = fl ? fl : NULL; __entry->fl = fl ? fl : NULL;
__entry->s_dev = inode->i_sb->s_dev; __entry->s_dev = inode->i_sb->s_dev;
__entry->i_ino = inode->i_ino; __entry->i_ino = inode->i_ino;
__entry->fl_next = fl ? fl->fl_next : NULL; __entry->fl_blocker = fl ? fl->fl_blocker : NULL;
__entry->fl_owner = fl ? fl->fl_owner : NULL; __entry->fl_owner = fl ? fl->fl_owner : NULL;
__entry->fl_pid = fl ? fl->fl_pid : 0; __entry->fl_pid = fl ? fl->fl_pid : 0;
__entry->fl_flags = fl ? fl->fl_flags : 0; __entry->fl_flags = fl ? fl->fl_flags : 0;
@ -92,9 +92,9 @@ DECLARE_EVENT_CLASS(filelock_lock,
__entry->ret = ret; __entry->ret = ret;
), ),
TP_printk("fl=0x%p dev=0x%x:0x%x ino=0x%lx fl_next=0x%p fl_owner=0x%p fl_pid=%u fl_flags=%s fl_type=%s fl_start=%lld fl_end=%lld ret=%d", TP_printk("fl=0x%p dev=0x%x:0x%x ino=0x%lx fl_blocker=0x%p fl_owner=0x%p fl_pid=%u fl_flags=%s fl_type=%s fl_start=%lld fl_end=%lld ret=%d",
__entry->fl, MAJOR(__entry->s_dev), MINOR(__entry->s_dev), __entry->fl, MAJOR(__entry->s_dev), MINOR(__entry->s_dev),
__entry->i_ino, __entry->fl_next, __entry->fl_owner, __entry->i_ino, __entry->fl_blocker, __entry->fl_owner,
__entry->fl_pid, show_fl_flags(__entry->fl_flags), __entry->fl_pid, show_fl_flags(__entry->fl_flags),
show_fl_type(__entry->fl_type), show_fl_type(__entry->fl_type),
__entry->fl_start, __entry->fl_end, __entry->ret) __entry->fl_start, __entry->fl_end, __entry->ret)
@ -125,7 +125,7 @@ DECLARE_EVENT_CLASS(filelock_lease,
__field(struct file_lock *, fl) __field(struct file_lock *, fl)
__field(unsigned long, i_ino) __field(unsigned long, i_ino)
__field(dev_t, s_dev) __field(dev_t, s_dev)
__field(struct file_lock *, fl_next) __field(struct file_lock *, fl_blocker)
__field(fl_owner_t, fl_owner) __field(fl_owner_t, fl_owner)
__field(unsigned int, fl_flags) __field(unsigned int, fl_flags)
__field(unsigned char, fl_type) __field(unsigned char, fl_type)
@ -137,7 +137,7 @@ DECLARE_EVENT_CLASS(filelock_lease,
__entry->fl = fl ? fl : NULL; __entry->fl = fl ? fl : NULL;
__entry->s_dev = inode->i_sb->s_dev; __entry->s_dev = inode->i_sb->s_dev;
__entry->i_ino = inode->i_ino; __entry->i_ino = inode->i_ino;
__entry->fl_next = fl ? fl->fl_next : NULL; __entry->fl_blocker = fl ? fl->fl_blocker : NULL;
__entry->fl_owner = fl ? fl->fl_owner : NULL; __entry->fl_owner = fl ? fl->fl_owner : NULL;
__entry->fl_flags = fl ? fl->fl_flags : 0; __entry->fl_flags = fl ? fl->fl_flags : 0;
__entry->fl_type = fl ? fl->fl_type : 0; __entry->fl_type = fl ? fl->fl_type : 0;
@ -145,9 +145,9 @@ DECLARE_EVENT_CLASS(filelock_lease,
__entry->fl_downgrade_time = fl ? fl->fl_downgrade_time : 0; __entry->fl_downgrade_time = fl ? fl->fl_downgrade_time : 0;
), ),
TP_printk("fl=0x%p dev=0x%x:0x%x ino=0x%lx fl_next=0x%p fl_owner=0x%p fl_flags=%s fl_type=%s fl_break_time=%lu fl_downgrade_time=%lu", TP_printk("fl=0x%p dev=0x%x:0x%x ino=0x%lx fl_blocker=0x%p fl_owner=0x%p fl_flags=%s fl_type=%s fl_break_time=%lu fl_downgrade_time=%lu",
__entry->fl, MAJOR(__entry->s_dev), MINOR(__entry->s_dev), __entry->fl, MAJOR(__entry->s_dev), MINOR(__entry->s_dev),
__entry->i_ino, __entry->fl_next, __entry->fl_owner, __entry->i_ino, __entry->fl_blocker, __entry->fl_owner,
show_fl_flags(__entry->fl_flags), show_fl_flags(__entry->fl_flags),
show_fl_type(__entry->fl_type), show_fl_type(__entry->fl_type),
__entry->fl_break_time, __entry->fl_downgrade_time) __entry->fl_break_time, __entry->fl_downgrade_time)