In designing a streaming media application, I want to use a single event processing loop for both disk and network I/O. The idea is that the I/O done in this loop should never block. Doing this for network I/O is pretty standard (i.e. set O_NONBLOCK and use a poll variant).
Asynchronous/nonblocking file I/O has its limitations, however. AIO can only be used in conjunction with O_DIRECT, and I'd rather be able to utilize the page cache. Even so, it is difficult to mix io_getevents with poll in a single event loop. You could use mmap/mincore, but there is still a race between the mincore call and the actual read of the data. So, have I missed any other tools which would help to solve this problem? It seems that if we introduced a nonblocking flag for file I/O, this problem would be addressed. Call it O_ATOMICREAD or some such thing. It's actually quite easy to do (patch attached). I even went so far as to modify squid's aufs store type to use this, so there is use outside of just the streaming media example given above (though I haven't had time to benchmark it). Comments? Thanks in advance, Jeff
--- linux-2.6.11/fs/fcntl.c.orig 2005-03-17 13:48:28.302745792 -0500 +++ linux-2.6.11/fs/fcntl.c 2005-03-17 13:48:48.203720384 -0500 @@ -181,7 +181,7 @@ asmlinkage long sys_dup(unsigned int fil return ret; } -#define SETFL_MASK (O_APPEND | O_NONBLOCK | O_NDELAY | FASYNC | O_DIRECT | O_NOATIME) +#define SETFL_MASK (O_APPEND | O_NONBLOCK | O_NDELAY | FASYNC | O_DIRECT | O_NOATIME | O_ATOMICREAD) static int setfl(int fd, struct file * filp, unsigned long arg) { --- linux-2.6.11/include/asm-mips/fcntl.h.orig 2005-03-17 14:01:08.039248288 -0500 +++ linux-2.6.11/include/asm-mips/fcntl.h 2005-03-17 14:01:30.365854128 -0500 @@ -27,6 +27,7 @@ #define O_DIRECTORY 0x10000 /* must be a directory */ #define O_NOFOLLOW 0x20000 /* don't follow links */ #define O_NOATIME 0x40000 +#define O_ATOMICREAD 0x80000 /* non-blocking file i/o */ #define O_NDELAY O_NONBLOCK --- linux-2.6.11/include/asm-parisc/fcntl.h.orig 2005-03-17 14:02:01.120178760 -0500 +++ linux-2.6.11/include/asm-parisc/fcntl.h 2005-03-17 14:02:02.160020680 -0500 @@ -20,6 +20,7 @@ #define O_DSYNC 01000000 /* HPUX only */ #define O_RSYNC 02000000 /* HPUX only */ #define O_NOATIME 04000000 +#define O_ATOMICREAD 10000000 /* non-blocking file i/o */ #define FASYNC 00020000 /* fcntl, for BSD compatibility */ #define O_DIRECT 00040000 /* direct disk access hint - currently ignored */ --- linux-2.6.11/include/asm-ppc64/fcntl.h.orig 2005-03-17 13:57:16.464453008 -0500 +++ linux-2.6.11/include/asm-ppc64/fcntl.h 2005-03-17 13:57:26.291959000 -0500 @@ -28,6 +28,7 @@ #define O_LARGEFILE 0200000 #define O_DIRECT 0400000 /* direct disk access hint */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-x86_64/fcntl.h.orig 2005-03-17 13:56:19.711080832 -0500 +++ linux-2.6.11/include/asm-x86_64/fcntl.h 2005-03-17 13:56:24.575341352 -0500 @@ -21,6 +21,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-arm/fcntl.h.orig 2005-03-17 13:58:49.073374312 -0500 +++ linux-2.6.11/include/asm-arm/fcntl.h 2005-03-17 13:58:50.032228544 -0500 @@ -21,6 +21,7 @@ #define O_DIRECT 0200000 /* direct disk access hint - currently ignored */ #define O_LARGEFILE 0400000 #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-m68k/fcntl.h.orig 2005-03-17 14:00:32.230692016 -0500 +++ linux-2.6.11/include/asm-m68k/fcntl.h 2005-03-17 14:00:33.107558712 -0500 @@ -21,6 +21,7 @@ #define O_DIRECT 0200000 /* direct disk access hint - currently ignored */ #define O_LARGEFILE 0400000 #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-ppc/fcntl.h.orig 2005-03-17 13:56:56.661463520 -0500 +++ linux-2.6.11/include/asm-ppc/fcntl.h 2005-03-17 13:57:07.509814320 -0500 @@ -21,6 +21,7 @@ #define O_LARGEFILE 0200000 #define O_DIRECT 0400000 /* direct disk access hint */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-sparc/fcntl.h.orig 2005-03-17 14:02:57.827557928 -0500 +++ linux-2.6.11/include/asm-sparc/fcntl.h 2005-03-17 14:02:58.682427968 -0500 @@ -22,6 +22,7 @@ #define O_LARGEFILE 0x40000 #define O_DIRECT 0x100000 /* direct disk access hint */ #define O_NOATIME 0x200000 +#define O_ATOMICREAD 0x400000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-alpha/fcntl.h.orig 2005-03-17 13:58:22.624395168 -0500 +++ linux-2.6.11/include/asm-alpha/fcntl.h 2005-03-17 13:58:23.599246968 -0500 @@ -22,6 +22,7 @@ #define O_LARGEFILE 0400000 /* will be set by the kernel on every open */ #define O_DIRECT 02000000 /* direct disk access - should check with OSF/1 */ #define O_NOATIME 04000000 +#define O_ATOMICREAD 10000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-v850/fcntl.h.orig 2005-03-17 14:03:45.439319840 -0500 +++ linux-2.6.11/include/asm-v850/fcntl.h 2005-03-17 14:03:46.312187144 -0500 @@ -21,6 +21,7 @@ #define O_DIRECT 0200000 /* direct disk access hint - currently ignored */ #define O_LARGEFILE 0400000 #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-i386/fcntl.h.orig 2005-03-17 13:55:43.761545992 -0500 +++ linux-2.6.11/include/asm-i386/fcntl.h 2005-03-17 13:56:02.172747064 -0500 @@ -21,6 +21,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-frv/fcntl.h.orig 2005-03-17 13:59:33.734584776 -0500 +++ linux-2.6.11/include/asm-frv/fcntl.h 2005-03-17 13:59:34.580456184 -0500 @@ -21,6 +21,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-m32r/fcntl.h.orig 2005-03-17 14:00:13.786495960 -0500 +++ linux-2.6.11/include/asm-m32r/fcntl.h 2005-03-17 14:00:14.661362960 -0500 @@ -25,6 +25,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-h8300/fcntl.h.orig 2005-03-17 13:59:56.604108080 -0500 +++ linux-2.6.11/include/asm-h8300/fcntl.h 2005-03-17 13:59:57.522968392 -0500 @@ -21,6 +21,7 @@ #define O_DIRECT 0200000 /* direct disk access hint - currently ignored */ #define O_LARGEFILE 0400000 #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-s390/fcntl.h.orig 2005-03-17 13:57:42.654471520 -0500 +++ linux-2.6.11/include/asm-s390/fcntl.h 2005-03-17 13:57:43.860288208 -0500 @@ -28,6 +28,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-ia64/fcntl.h.orig 2005-03-17 13:56:44.119370208 -0500 +++ linux-2.6.11/include/asm-ia64/fcntl.h 2005-03-17 13:56:46.889949016 -0500 @@ -29,6 +29,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-cris/fcntl.h.orig 2005-03-17 13:59:20.996521256 -0500 +++ linux-2.6.11/include/asm-cris/fcntl.h 2005-03-17 13:59:22.037363024 -0500 @@ -23,6 +23,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get f_flags */ --- linux-2.6.11/include/asm-sparc64/fcntl.h.orig 2005-03-17 14:03:18.313443600 -0500 +++ linux-2.6.11/include/asm-sparc64/fcntl.h 2005-03-17 14:03:19.482265912 -0500 @@ -22,6 +22,7 @@ #define O_LARGEFILE 0x40000 #define O_DIRECT 0x100000 /* direct disk access hint */ #define O_NOATIME 0x200000 +#define O_ATOMICREAD 0x400000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ --- linux-2.6.11/include/asm-arm26/fcntl.h.orig 2005-03-17 13:59:04.970957512 -0500 +++ linux-2.6.11/include/asm-arm26/fcntl.h 2005-03-17 13:59:06.485727232 -0500 @@ -21,6 +21,7 @@ #define O_DIRECT 0200000 /* direct disk access hint - currently ignored */ #define O_LARGEFILE 0400000 #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/include/asm-sh/fcntl.h.orig 2005-03-17 14:02:16.734804976 -0500 +++ linux-2.6.11/include/asm-sh/fcntl.h 2005-03-17 14:02:24.028696136 -0500 @@ -21,6 +21,7 @@ #define O_DIRECTORY 0200000 /* must be a directory */ #define O_NOFOLLOW 0400000 /* don't follow links */ #define O_NOATIME 01000000 +#define O_ATOMICREAD 02000000 /* non-blocking file i/o */ #define F_DUPFD 0 /* dup */ #define F_GETFD 1 /* get close_on_exec */ --- linux-2.6.11/mm/filemap.c.orig 2005-03-17 13:37:48.270045552 -0500 +++ linux-2.6.11/mm/filemap.c 2005-03-17 13:48:20.594917560 -0500 @@ -696,7 +696,7 @@ void do_generic_mapping_read(struct addr unsigned long prev_index; loff_t isize; struct page *cached_page; - int error; + int error, nonblock = filp->f_flags & O_ATOMICREAD; struct file_ra_state ra = *_ra; cached_page = NULL; @@ -728,7 +728,7 @@ void do_generic_mapping_read(struct addr nr = nr - offset; cond_resched(); - if (index == next_index && req_size) { + if (index == next_index && req_size && !nonblock) { ret_size = page_cache_readahead(mapping, &ra, filp, index, req_size); next_index += ret_size; @@ -738,11 +738,21 @@ void do_generic_mapping_read(struct addr find_page: page = find_get_page(mapping, index); if (unlikely(page == NULL)) { + if (nonblock) { + desc->error = -EWOULDBLOCK; + break; + } handle_ra_miss(mapping, &ra, index); goto no_cached_page; } - if (!PageUptodate(page)) + if (!PageUptodate(page)) { + if (nonblock) { + page_cache_release(page); + desc->error = -EWOULDBLOCK; + break; + } goto page_not_up_to_date; + } page_ok: /* If users can be writing to this page using arbitrary @@ -1000,7 +1010,7 @@ __generic_file_aio_read(struct kiocb *io desc.error = 0; do_generic_file_read(filp,ppos,&desc,file_read_actor); retval += desc.written; - if (!retval) { + if (!retval || desc.error) { retval = desc.error; break; }