Move FASYNC bit handling to f_op->fasync()
Removing the BKL from FASYNC handling ran into the challenge of keeping the setting of the FASYNC bit in filp->f_flags atomic with regard to calls to the underlying fasync() function. Andi Kleen suggested moving the handling of that bit into fasync(); this patch does exactly that. As a result, we have a couple of internal API changes: fasync() must now manage the FASYNC bit, and it will be called without the BKL held. As it happens, every fasync() implementation in the kernel with one exception calls fasync_helper(). So, if we make fasync_helper() set the FASYNC bit, we can avoid making any changes to the other fasync() functions - as long as those functions, themselves, have proper locking. Most fasync() implementations do nothing but call fasync_helper() - which has its own lock - so they are easily verified as correct. The BKL had already been pushed down into the rest. The networking code has its own version of fasync_helper(), so that code has been augmented with explicit FASYNC bit handling. Cc: Al Viro <viro@ZenIV.linux.org.uk> Cc: David Miller <davem@davemloft.net> Reviewed-by: Christoph Hellwig <hch@lst.de> Signed-off-by: Jonathan Corbet <corbet@lwn.net>
This commit is contained in:
		
							parent
							
								
									db1dd4d376
								
							
						
					
					
						commit
						76398425bb
					
				| @ -437,8 +437,11 @@ grab BKL for cases when we close a file that had been opened r/w, but that | ||||
| can and should be done using the internal locking with smaller critical areas). | ||||
| Current worst offender is ext2_get_block()... | ||||
| 
 | ||||
| ->fasync() is a mess. This area needs a big cleanup and that will probably | ||||
| affect locking. | ||||
| ->fasync() is called without BKL protection, and is responsible for | ||||
| maintaining the FASYNC bit in filp->f_flags.  Most instances call | ||||
| fasync_helper(), which does that maintenance, so it's not normally | ||||
| something one needs to worry about.  Return values > 0 will be mapped to | ||||
| zero in the VFS layer. | ||||
| 
 | ||||
| ->readdir() and ->ioctl() on directories must be changed. Ideally we would | ||||
| move ->readdir() to inode_operations and use a separate method for directory | ||||
|  | ||||
							
								
								
									
										29
									
								
								fs/fcntl.c
									
									
									
									
									
								
							
							
						
						
									
										29
									
								
								fs/fcntl.c
									
									
									
									
									
								
							| @ -141,7 +141,7 @@ SYSCALL_DEFINE1(dup, unsigned int, fildes) | ||||
| 	return ret; | ||||
| } | ||||
| 
 | ||||
| #define SETFL_MASK (O_APPEND | O_NONBLOCK | O_NDELAY | FASYNC | O_DIRECT | O_NOATIME) | ||||
| #define SETFL_MASK (O_APPEND | O_NONBLOCK | O_NDELAY | O_DIRECT | O_NOATIME) | ||||
| 
 | ||||
| static int setfl(int fd, struct file * filp, unsigned long arg) | ||||
| { | ||||
| @ -177,23 +177,19 @@ static int setfl(int fd, struct file * filp, unsigned long arg) | ||||
| 		return error; | ||||
| 
 | ||||
| 	/*
 | ||||
| 	 * We still need a lock here for now to keep multiple FASYNC calls | ||||
| 	 * from racing with each other. | ||||
| 	 * ->fasync() is responsible for setting the FASYNC bit. | ||||
| 	 */ | ||||
| 	lock_kernel(); | ||||
| 	if ((arg ^ filp->f_flags) & FASYNC) { | ||||
| 		if (filp->f_op && filp->f_op->fasync) { | ||||
| 			error = filp->f_op->fasync(fd, filp, (arg & FASYNC) != 0); | ||||
| 			if (error < 0) | ||||
| 				goto out; | ||||
| 		} | ||||
| 	if (((arg ^ filp->f_flags) & FASYNC) && filp->f_op && | ||||
| 			filp->f_op->fasync) { | ||||
| 		error = filp->f_op->fasync(fd, filp, (arg & FASYNC) != 0); | ||||
| 		if (error < 0) | ||||
| 			goto out; | ||||
| 	} | ||||
| 
 | ||||
| 	spin_lock(&filp->f_lock); | ||||
| 	filp->f_flags = (arg & SETFL_MASK) | (filp->f_flags & ~SETFL_MASK); | ||||
| 	spin_unlock(&filp->f_lock); | ||||
| 
 | ||||
|  out: | ||||
| 	unlock_kernel(); | ||||
| 	return error; | ||||
| } | ||||
| 
 | ||||
| @ -518,7 +514,7 @@ static DEFINE_RWLOCK(fasync_lock); | ||||
| static struct kmem_cache *fasync_cache __read_mostly; | ||||
| 
 | ||||
| /*
 | ||||
|  * fasync_helper() is used by some character device drivers (mainly mice) | ||||
|  * fasync_helper() is used by almost all character device drivers | ||||
|  * to set up the fasync queue. It returns negative on error, 0 if it did | ||||
|  * no changes and positive if it added/deleted the entry. | ||||
|  */ | ||||
| @ -557,6 +553,13 @@ int fasync_helper(int fd, struct file * filp, int on, struct fasync_struct **fap | ||||
| 		result = 1; | ||||
| 	} | ||||
| out: | ||||
| 	/* Fix up FASYNC bit while still holding fasync_lock */ | ||||
| 	spin_lock(&filp->f_lock); | ||||
| 	if (on) | ||||
| 		filp->f_flags |= FASYNC; | ||||
| 	else | ||||
| 		filp->f_flags &= ~FASYNC; | ||||
| 	spin_unlock(&filp->f_lock); | ||||
| 	write_unlock_irq(&fasync_lock); | ||||
| 	return result; | ||||
| } | ||||
|  | ||||
							
								
								
									
										13
									
								
								fs/ioctl.c
									
									
									
									
									
								
							
							
						
						
									
										13
									
								
								fs/ioctl.c
									
									
									
									
									
								
							| @ -427,19 +427,11 @@ static int ioctl_fioasync(unsigned int fd, struct file *filp, | ||||
| 	/* Did FASYNC state change ? */ | ||||
| 	if ((flag ^ filp->f_flags) & FASYNC) { | ||||
| 		if (filp->f_op && filp->f_op->fasync) | ||||
| 			/* fasync() adjusts filp->f_flags */ | ||||
| 			error = filp->f_op->fasync(fd, filp, on); | ||||
| 		else | ||||
| 			error = -ENOTTY; | ||||
| 	} | ||||
| 	if (error) | ||||
| 		return error; | ||||
| 
 | ||||
| 	spin_lock(&filp->f_lock); | ||||
| 	if (on) | ||||
| 		filp->f_flags |= FASYNC; | ||||
| 	else | ||||
| 		filp->f_flags &= ~FASYNC; | ||||
| 	spin_unlock(&filp->f_lock); | ||||
| 	return error; | ||||
| } | ||||
| 
 | ||||
| @ -507,10 +499,7 @@ int do_vfs_ioctl(struct file *filp, unsigned int fd, unsigned int cmd, | ||||
| 		break; | ||||
| 
 | ||||
| 	case FIOASYNC: | ||||
| 		/* BKL needed to avoid races tweaking f_flags */ | ||||
| 		lock_kernel(); | ||||
| 		error = ioctl_fioasync(fd, filp, argp); | ||||
| 		unlock_kernel(); | ||||
| 		break; | ||||
| 
 | ||||
| 	case FIOQSIZE: | ||||
|  | ||||
| @ -1030,6 +1030,13 @@ static int sock_fasync(int fd, struct file *filp, int on) | ||||
| 
 | ||||
| 	lock_sock(sk); | ||||
| 
 | ||||
| 	spin_lock(&filp->f_lock); | ||||
| 	if (on) | ||||
| 		filp->f_flags |= FASYNC; | ||||
| 	else | ||||
| 		filp->f_flags &= ~FASYNC; | ||||
| 	spin_unlock(&filp->f_lock); | ||||
| 
 | ||||
| 	prev = &(sock->fasync_list); | ||||
| 
 | ||||
| 	for (fa = *prev; fa != NULL; prev = &fa->fa_next, fa = *prev) | ||||
|  | ||||
		Loading…
	
		Reference in New Issue
	
	Block a user