File change notification

From: Rüdiger Klaehn
Date: Wed Dec 31 2003 - 09:37:03 EST


Hi everybody.

This is my first post to lkml, so please be patient with me

I have been wondering for some time why there is no decent file change notification mechanism in linux. Is there some deep philosophical reason for this, or is it just that nobody has found the time to implement it? If it is the latter, I am willing to implement it as long there is a chance to get this accepted into the mainstream kernel.

Is there already somebody working on this problem? I know a few efforts that try to do something similar, but they all work by intercepting every single system call that has to do with files, and they are thus not very fast. See for example
<http://www.bangstate.com/software.html#changedfiles>
<http://cvs.sourceforge.net/cgi-bin/viewcvs.cgi/openxdsm/openxdsm/eventmodule/>


The dnotify mechanism is very limited since it requires a file handle, it is not working for whole directory trees and it does not report much useful information. For example to watch for changes in the /home tree you would have to open every single directory in the tree, which would probably not even work since it would require more than the maximum number of file handles. If you have a directory with many files in it, the only thing dnotify tells you is that something has changed in the directory, so you have to rescan the whole directory to find out which file has changed. Kind of defeats the purpose of change notification...

What I would like to have would be some way to watch for certain changes anywhere in a whole tree or even the whole file system. This new mechanism should have no measurable performance impact and should log all information that is readily available. The amount of new code in kernel space should be as small as possible. So complicated stuff like pattern matching would have to happen in user space.

I wrote some experimental mechanism yesterday. Whenever a file is accessed or changed, I write all easily available information to a ring buffer which is presented to user space as a device. The information that is easily available is the inode number of the file or directory that has changed, the inode number of the directory in which the change took place, and in most cases the name of the dentry of the file that has changed.

Here is the struct I use for logging:

typedef struct
{
unsigned long event; /* the type of change. As of now, I use the same constants as dnotify */
unsigned long file_ino; /* the inode of the file that has changed (if available) */
unsigned long src_ino; /* the inode of the directory in which the change took place (if available) */
unsigned long dst_ino; /* the inode of the destination directory. This is only used when logging moves */
unsigned char name[DNAME_LEN]; /* the name of the dentry of the changed file. This is simply truncated if it is too long. */
} inotify_info;

Information that is not easily available and therefore not logged includes the full path(s) of the changed file/directory. If you want or need that, you will have to look it up in user space.

Since I only log information that can be gathered at practically no cost, the logging does not take any noticeable time in kernel space.

I attached a patch containing the code I wrote yesterday. This is very preliminary and probably not bug-free. I would like to have feedback on the general approach before I spend more time refining this.

best regards,

Rüdiger Klaehn


diff -urN -X dontdiff vanilla/fs/dnotify.c develop/fs/dnotify.c
--- vanilla/fs/dnotify.c 2003-10-17 23:43:00.000000000 +0200
+++ develop/fs/dnotify.c 2003-12-31 16:59:36.000000000 +0100
@@ -153,8 +153,9 @@
void dnotify_parent(struct dentry *dentry, unsigned long event)
{
struct dentry *parent;
-
spin_lock(&dentry->d_lock);
+ /* call inotify for this dentry */
+ inotify_dentrychange(dentry,event);
parent = dentry->d_parent;
if (parent->d_inode->i_dnotify_mask & event) {
dget(parent);
diff -urN -X dontdiff vanilla/fs/inotify.c develop/fs/inotify.c
--- vanilla/fs/inotify.c 1970-01-01 01:00:00.000000000 +0100
+++ develop/fs/inotify.c 2003-12-31 16:59:39.000000000 +0100
@@ -0,0 +1,306 @@
+/*
+ * Inode notifications for Linux.
+ *
+ * Copyright (C) 2003,2004 Rüdiger Klaehn
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License as published by the
+ * Free Software Foundation; either version 2, or (at your option) any
+ * later version.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * General Public License for more details.
+ */
+#ifdef HAVE_CONFIG_H
+#include "../config.h"
+#endif
+
+#include <linux/slab.h>
+#include <linux/kernel.h>
+#include <linux/module.h>
+#include <linux/fs.h>
+#include <linux/sched.h>
+#include <linux/init.h>
+#include <asm/segment.h>
+#include <asm/uaccess.h>
+#include <linux/string.h>
+#include <linux/types.h>
+#include <linux/smp_lock.h>
+#include <asm/segment.h>
+
+#define BUFFER_LEN 512
+#define DNAME_LEN 32
+#define IGNORE_LEN 16
+#define DEBUG 2
+
+typedef struct
+{
+ unsigned long event;
+ unsigned long file_ino;
+ unsigned long src_ino;
+ unsigned long dst_ino;
+ unsigned char name[DNAME_LEN];
+} in_info;
+
+/* The ring buffer. Statically allocated as of now */
+in_info in_buffer[BUFFER_LEN];
+int in_buffer_head = 0;
+int in_buffer_tail = 0;
+spinlock_t in_lock = SPIN_LOCK_UNLOCKED;
+unsigned long lock_flags;
+unsigned long in_ignore[IGNORE_LEN];
+
+/* device info for the in device */
+static int in_major = 40;
+
+int add_ignore_ino(unsigned long ino)
+{
+ int i;
+ for(i=0;i<IGNORE_LEN;i++)
+ if(in_ignore[i]==0)
+ {
+ in_ignore[i]=ino;
+ return 1;
+ }
+ return 0;
+}
+
+int remove_ignore_ino(unsigned long ino)
+{
+ int i;
+ for(i=0;i<IGNORE_LEN;i++)
+ if(in_ignore[i]==ino)
+ {
+ in_ignore[i]=0;
+ return 1;
+ }
+ return 0;
+}
+
+int test_ignore_ino(unsigned long ino)
+{
+ int i;
+ if(!ino)
+ return 1;
+ for(i=0;i<IGNORE_LEN;i++)
+ if(in_ignore[i]==ino)
+ return 1;
+ return 0;
+}
+
+int in_get_from_buffer(in_info *info)
+{
+ spin_lock_irqsave(&in_lock, lock_flags);
+ if (in_buffer_head == in_buffer_tail)
+ {
+ spin_unlock_irqrestore( &in_lock, lock_flags );
+ return 0;
+ }
+ memcpy(info,&in_buffer[in_buffer_head],sizeof(in_info));
+ memset(&in_buffer[in_buffer_head],0,sizeof(in_info));
+ in_buffer_head++;
+ if(in_buffer_head == BUFFER_LEN) in_buffer_head=0;
+ spin_unlock_irqrestore( &in_lock, lock_flags );
+ return 1;
+}
+
+int in_put_to_buffer(in_info *info)
+{
+ #if DEBUG>2
+ printk("in: put_to_buffer: %ld %ld %ld %ld\n",
+ info->event,info->file_ino,info->src_ino,info->dst_ino);
+ #endif
+ spin_lock_irqsave(&in_lock, lock_flags);
+ if((in_buffer_tail + 1) == in_buffer_head || (
+ ((in_buffer_tail + 1) == BUFFER_LEN) &&
+ ( in_buffer_head == 0 ) ))
+ {
+ /* Buffer overrun. Drop one entry! */
+ in_buffer_head++;
+ if ( in_buffer_head == BUFFER_LEN )
+ {
+ in_buffer_head = 0;
+ }
+ /*signal changedfiles_buffer overrun*/
+ /*strncpy( (char *)changedfiles_buffer[cf_buffer_head], "!", 2);*/
+ }
+ memcpy(&in_buffer[in_buffer_tail],info,sizeof(in_info));
+ in_buffer_tail++;
+ if ( in_buffer_tail == BUFFER_LEN )
+ in_buffer_tail=0;
+ spin_unlock_irqrestore( &in_lock, lock_flags );
+ return 1;
+}
+
+/*
+void in_zero_buffer()
+{
+ int i;
+ for (i=0; i < BUFFER_LEN; i++)
+ {
+ memset(&in_buffer[i], 0, sizeof(in_info));
+ }
+ return;
+}
+*/
+
+int in_open_dev( struct inode *in,struct file * fi )
+{
+ MOD_INC_USE_COUNT;
+ add_ignore_ino(in->i_ino);
+#if DEBUG > 1
+ printk("inotify: in_open_dev() %ld\n",in->i_ino);
+#endif
+ return 0;
+}
+
+int in_close_dev( struct inode *in,struct file * fi )
+{
+#if DEBUG > 1
+ printk("inotify: in_close_dev() %ld\n",in->i_ino);
+#endif
+ remove_ignore_ino(in->i_ino);
+ MOD_DEC_USE_COUNT;
+ return 0;
+}
+
+/*ssize_t changedfiles_read_dev( struct inode *in,
+ struct file *fi,
+ char * buf,
+ unsigned long count ) */
+ssize_t in_read_dev( struct file *filep, char *buf, size_t count,loff_t *f_pos )
+{
+ in_info read_buf;
+ if(!in_get_from_buffer(&read_buf))
+ return 0;
+#if DEBUG>2
+ printk("inotify: got info from buffer\n");
+#endif
+ if(count>sizeof(in_info))
+ count=sizeof(in_info);
+ if(copy_to_user(buf,&read_buf,count))
+ {
+ printk("inotify: copy_to_user failed\n");
+ return -EFAULT;
+ }
+#if DEBUG>2
+ printk("inotify: changedfiles_read_dev() returning");
+#endif
+ return count;
+}
+
+static struct file_operations in_fop = {
+ read: in_read_dev,
+ open: in_open_dev,
+ release: in_close_dev,
+};
+
+/*
+ * This function should be called whenever something changes on an inode
+ * where we do not have the dentry, such as reading and writing
+*/
+void inotify_inodechange(struct inode *inode, unsigned long event)
+{
+ in_info info;
+ memset(&info,0,sizeof(in_info));
+ if(test_ignore_ino(inode->i_ino))
+ return;
+ info.event=event;
+ info.file_ino=inode->i_ino;
+ info.src_ino=0;
+ info.dst_ino=0;
+ in_put_to_buffer(&info);
+}
+
+/*
+ * This function should be called when something changes about a dentry, such
+ * as attributes, creating, deleting, renaming etc.
+ */
+void inotify_dentrychange(struct dentry *dentry,unsigned long event)
+{
+ in_info info;
+ struct dentry *parent;
+ memset(&info,0,sizeof(in_info));
+ info.event=event;
+ spin_lock(&dentry->d_lock);
+ if(dentry->d_inode)
+ info.file_ino=dentry->d_inode->i_ino;
+ else
+ info.file_ino=0;
+ if(test_ignore_ino(info.file_ino))
+ goto ignore;
+ parent=dentry->d_parent;
+ if(parent!=dentry)
+ {
+ dget(parent);
+ info.src_ino=parent->d_inode->i_ino;
+ dput(parent);
+ }
+ else
+ info.src_ino=0;
+ if(test_ignore_ino(info.src_ino))
+ goto ignore;
+ info.dst_ino=0;
+ strncpy(info.name,dentry->d_name.name,DNAME_LEN);
+ spin_unlock(&dentry->d_lock);
+ in_put_to_buffer(&info);
+ return;
+ignore:
+ spin_unlock(&dentry->d_lock);
+ return;
+}
+
+/*
+ * This function should be called whenever a dentry is moved (after it is moved)
+ * This one needs a lot of work!
+ */
+void inotify_dentrymove(struct dentry *dentry,struct dentry *dsrc,unsigned long event)
+{
+/* in_info info;
+ struct dentry *parent;
+ memset(&info,0,sizeof(in_info));
+ info.event=event;
+ spin_lock(&dentry->d_lock);
+ if(dentry->d_inode)
+ info.file_ino=dentry->d_inode->i_ino;
+ else
+ info.file_ino=0;
+ parent=dentry->d_parent;
+ if(parent!=dentry)
+ {
+ dget(parent);
+ info.dst_ino=parent->d_inode->i_ino;
+ dput(parent);
+ }
+ else
+ info.dst_ino=0;
+ strncpy(info.name,dentry->d_name.name,DNAME_LEN);
+ spin_unlock(&dentry->d_lock);
+ spin_lock(&dsrc->d_lock);
+ if(dsrc->d_inode)
+ info.src_ino=dsrc->d_inode->i_ino;
+ else
+ info.dst_ino=0;
+ spin_unlock(&dsrc->d_lock);
+ in_put_to_buffer(&info);*/
+}
+
+static int __init inotify_init(void)
+{
+#ifdef DEBUG
+ printk("initializing inotify subsystem...\n");
+#endif
+ int i;
+ for (i=0; i < BUFFER_LEN; i++)
+ {
+ memset(&in_buffer[i], 0, sizeof(in_info));
+ }
+ memset(&in_ignore,0,sizeof(in_ignore));
+ if ( register_chrdev(in_major, "inotify", &in_fop))
+ return -EIO;
+ return 0;
+}
+
+module_init(inotify_init)
diff -urN -X dontdiff vanilla/fs/Makefile develop/fs/Makefile
--- vanilla/fs/Makefile 2003-08-23 01:56:59.000000000 +0200
+++ develop/fs/Makefile 2003-12-31 16:59:36.000000000 +0100
@@ -10,7 +10,7 @@
namei.o fcntl.o ioctl.o readdir.o select.o fifo.o locks.o \
dcache.o inode.o attr.o bad_inode.o file.o dnotify.o \
filesystems.o namespace.o seq_file.o xattr.o libfs.o \
- fs-writeback.o mpage.o direct-io.o aio.o
+ fs-writeback.o mpage.o direct-io.o aio.o inotify.o

obj-$(CONFIG_EPOLL) += eventpoll.o
obj-$(CONFIG_COMPAT) += compat.o
diff -urN -X dontdiff vanilla/include/linux/dnotify.h develop/include/linux/dnotify.h
--- vanilla/include/linux/dnotify.h 2003-04-07 19:30:34.000000000 +0200
+++ develop/include/linux/dnotify.h 2003-12-31 16:59:43.000000000 +0100
@@ -22,6 +22,8 @@

static inline void inode_dir_notify(struct inode *inode, unsigned long event)
{
+ /* call inotify for this inode */
+ inotify_inodechange(inode,event);
if ((inode)->i_dnotify_mask & (event))
__inode_dir_notify(inode, event);
}
diff -urN -X dontdiff vanilla/include/linux/inotify.h develop/include/linux/inotify.h
--- vanilla/include/linux/inotify.h 1970-01-01 01:00:00.000000000 +0100
+++ develop/include/linux/inotify.h 2003-12-31 16:59:43.000000000 +0100
@@ -0,0 +1,17 @@
+/*
+ * Inode notification for Linux
+ *
+ * Copyright (C) 2003,2004 Rüdiger Klaehn
+ */
+
+#include <linux/fs.h>
+#define IN_ACCESS 0x00000001 /* Node accessed */
+#define IN_MODIFY 0x00000002 /* Node modified */
+#define IN_CREATE 0x00000004 /* Node created */
+#define IN_DELETE 0x00000008 /* Node removed */
+#define IN_RENAME 0x00000010 /* Node renamed */
+#define IN_ATTRIB 0x00000020 /* Node changed attibutes */
+
+extern void inotify_inodechange(struct inode *inode, unsigned long event);
+extern void inotify_dentrychange(struct dentry *dentry,unsigned long event);
+extern void inotify_dentrymove(struct dentry *dentry,struct dentry *dsrc,unsigned long event);