@HUST张友东 work@taobao zyd_com@126.com
分类: 服务器与存储
2010-02-01 13:48:03
fuse为开发者提供了两组接口,分别是fuse_lowlevel_ops以及fuse_operations,开发者只需要实现这两组接口的一种即可实现一个用户空间文件系统。
struct fuse_lowlevel_ops的成员如下所示,其中init方法在其它所有方法之前调用,用于初始化文件系统,fuse已经实现,destroy则是在文件系统被卸载时做一些清理工作。用于大多数请求的参数都是fuse_ino_t类型的ino,而文件系统提供给用户的视图是以文件名呈现的,故lookup是实现文件系统的关键,它在parent中查找名字name对应的文件,并返回相应的信息,可使用fuse_reply_entry或fuse_reply_err作为请求的返回。
接口中的方法对于了解过VFS的人应该都不难理解,只要按需实现这些接口,你就可以定制出属于自己的文件系统,这组接口的详细说明见fuse_lowlevel.h。
void(* |
)(void *userdata, struct *conn) |
void(* |
)(void *userdata) |
void(* |
)( req, parent, const char *name) |
void(* |
)( req, ino, unsigned long nlookup) |
void(* |
)( req, ino, struct *fi) |
void(* |
)( req, ino, struct stat *attr, int to_set, struct *fi) |
void(* |
)( req, ino) |
void(* |
)( req, parent, const char *name, mode_t mode, dev_t rdev) |
void(* |
)( req, parent, const char *name, mode_t mode) |
void(* |
)( req, parent, const char *name) |
void(* |
)( req, parent, const char *name) |
void(* |
)( req, const char *, parent, const char *name) |
void(* |
)( req, parent, const char *name, newparent, const char *newname) |
void(* |
)( req, ino, newparent, const char *newname) |
void(* |
)( req, ino, struct *fi) |
void(* |
)( req, ino, size_t size, off_t off, struct *fi) |
void(* |
)( req, ino, const char *buf, size_t size, off_t off, struct *fi) |
void(* |
)( req, ino, struct *fi) |
void(* |
)( req, ino, struct *fi) |
void(* |
)( req, ino, int datasync, struct *fi) |
void(* |
)( req, ino, struct *fi) |
void(* |
)( req, ino, size_t size, off_t off, struct *fi) |
void(* |
)( req, ino, struct *fi) |
void(* |
)( req, ino, int datasync, struct *fi) |
void(* |
)( req, ino) |
void(* |
)( req, ino, const char *name, const char *value, size_t size, int flags) |
void(* |
)( req, ino, const char *name, size_t size) |
void(* |
)( req, ino, size_t size) |
void(* |
)( req, ino, const char *name) |
void(* |
)( req, ino, int mask) |
void(* |
)( req, parent, const char *name, mode_t mode, struct *fi) |
void(* |
)( req, ino, struct *fi, struct flock *lock) |
void(* |
)( req, ino, struct *fi, struct flock *lock, int sleep) |
void(* |
)( req, ino, size_t blocksize, uint64_t idx) |
void(* |
)( req, ino, int cmd, void *arg, struct *fi, unsigned *flagsp, const void *in_buf, size_t in_bufsz, size_t out_bufszp) |
void(* |
)( req, ino, struct *fi, struct fuse_pollhandle *ph) |
用户实现的接口是如何跟这个结构关联起来的?
其实fuse中已经实现了一组接口,在fuse_lowlevel.c中,定义了一个静态的结构数组,该数组的元素为一组(函数,名字)的结构,但没做什么实际的工作,当fuse用户空间的daemon从/fuse/dev中读取到请求之后,它通过请求号来判别各个请求,并调用这里相应的处理函数,如读取到read调用时,会调用do_read进行处理。
static struct {
void (*func)(fuse_req_t, fuse_ino_t, const void *);
const char *name;
} fuse_ll_ops[] = {
//只列举了部分
[FUSE_LOOKUP] = { do_lookup, "LOOKUP" },
[FUSE_OPEN] = { do_open, "OPEN" },
[FUSE_READ] = { do_read, "READ" },
[FUSE_WRITE] = { do_write, "WRITE" },
[FUSE_STATFS] = { do_statfs, "STATFS" },
[FUSE_FLUSH] = { do_flush, "FLUSH" },
[FUSE_INIT] = { do_init, "INIT" },
[FUSE_OPENDIR] = { do_opendir, "OPENDIR" },
[FUSE_READDIR] = { do_readdir, "READDIR" },
[FUSE_RELEASEDIR] = { do_releasedir, "RELEASEDIR" },
[FUSE_DESTROY] = { do_destroy, "DESTROY" }
};
接下来看一下do_read的实现
static void do_read(fuse_req_t req, fuse_ino_t nodeid, const void *inarg)
{
struct fuse_read_in *arg = (struct fuse_read_in *) inarg;
// 如果用户实现了read操作,则调用用户空间的read,否则以没有实现该调用为错误响应,这里的op就是用户实现文件系统时实现的,并传递给fuse。
if (req->f->op.read) {
struct fuse_file_info fi;
memset(&fi, 0, sizeof(fi));
fi.fh = arg->fh;
fi.fh_old = fi.fh;
req->f->op.read(req, nodeid, arg->size, arg->offset, &fi);
} else
fuse_reply_err(req, ENOSYS);
}
从这里的实现可以看出,这些操作是没有加任何锁的,如果开发者需要文件系统锁,需要在实现文件系统时自行考虑。
fuse_operations又是怎么一回事?
对于实现fuse_lowlevel_ops这组接口,没有内核VFS相关知识的开发者是不可能完成的,为了增强fuse的通用性,使更多的用户能够使用fuse开发文件系统,fuse提供了一组更简单的接口fuse_operations,详细说明请参考fuse.h。这组接口的参数跟unix提供的系统调用的参数很类似,开发者更易理解,fuse想开发者屏蔽了底层的相关对象,直接以文件名作为参数,只有开发者按照自己的方式,把这组接口实现就可以,显然这比上面那组接口的实现要简单得多。
int(* |
)(const char *, struct stat *) |
int(* |
)(const char *, char *, size_t) |
int(* |
)(const char *, mode_t, dev_t) |
int(* |
)(const char *, mode_t) |
int(* |
)(const char *) |
int(* |
)(const char *) |
int(* |
)(const char *, const char *) |
int(* |
)(const char *, const char *) |
int(* |
)(const char *, const char *) |
int(* |
)(const char *, mode_t) |
int(* |
)(const char *, uid_t, gid_t) |
int(* |
)(const char *, off_t) |
int(* |
)(const char *, struct utimbuf *) |
int(* |
)(const char *, struct *) |
int(* |
)(const char *, char *, size_t, off_t, struct *) |
int(* |
)(const char *, const char *, size_t, off_t, struct *) |
int(* |
)(const char *, struct statvfs *) |
int(* |
)(const char *, struct *) |
int(* |
)(const char *, struct *) |
int(* |
)(const char *, int, struct *) |
int(* |
)(const char *, const char *, const char *, size_t, int) |
int(* |
)(const char *, const char *, char *, size_t) |
int(* |
)(const char *, char *, size_t) |
int(* |
)(const char *, const char *) |
int(* |
)(const char *, struct *) |
int(* |
)(const char *, void *, , off_t, struct *) |
int(* |
)(const char *, struct *) |
int(* |
)(const char *, int, struct *) |
void *(* |
)(struct *conn) |
void(* |
)(void *) |
int(* |
)(const char *, int) |
int(* |
)(const char *, mode_t, struct *) |
int(* |
)(const char *, off_t, struct *) |
int(* |
)(const char *, struct stat *, struct *) |
int(* |
)(const char *, struct *, int cmd, struct flock *) |
int(* |
)(const char *, const struct timespec tv[2]) |
int(* |
)(const char *, size_t blocksize, uint64_t *idx) |
unsigned int |
: 1 |
unsigned int |
: 31 |
int(* |
)(const char *, int cmd, void *arg, struct *, unsigned int flags, void *data) |
int(* |
)(const char *, struct *, struct fuse_pollhandle *ph, unsigned *reventsp) |
提供这组接口,fuse做了什么?
fuse还是实现了一组fuse_lowlevel_ops的接口,在fuse.c中
static struct fuse_lowlevel_ops fuse_path_ops = {
//只列举了部分方法
.init = fuse_lib_init,
.destroy = fuse_lib_destroy,
.lookup = fuse_lib_lookup,
.forget = fuse_lib_forget,
.getattr = fuse_lib_getattr,
.setattr = fuse_lib_setattr,
.access = fuse_lib_access,
.read = fuse_lib_read,
.readlink = fuse_lib_readlink
};
fuse实现的这组接口跟之前的方法不一样,不是什么都不做,它完成了部分工作,主要是文件节点与文件名的转换关系,然后将文件名作为参数,调用用户实现的fuse_operations的接口。
如fuse_lib_read的实现
int fuse_fs_read(struct fuse_fs *fs, const char *path, char *buf, size_t size,
off_t off, struct fuse_file_info *fi)
{
fuse_get_context()->private_data = fs->user_data;
//用户实现的方法
if (fs->op.read)
return fs->op.read(path, buf, size, off, fi);
else
return -ENOSYS;
}
static void fuse_lib_read(fuse_req_t req, fuse_ino_t ino, size_t size,
off_t off, struct fuse_file_info *fi)
{
struct fuse *f = req_fuse_prepare(req);
char *path;
char *buf;
int res;
buf = (char *) malloc(size);
if (buf == NULL) {
reply_err(req, -ENOMEM);
return;
}
res = -ENOENT;
pthread_rwlock_rdlock(&f->tree_lock); //fuse_operations使用了读写锁
//由ino获取path
path = get_path(f, ino);
if (path != NULL) {
struct fuse_intr_data d;
if (f->conf.debug)
fprintf(stderr, "READ[%llu] %lu bytes from %llu\n",
(unsigned long long) fi->fh, (unsigned long) size,
(unsigned long long) off);
fuse_prepare_interrupt(f, req, &d);
res = fuse_fs_read(f->fs, path, buf, size, off, fi); //通过这个方法调用用户实现的方法
fuse_finish_interrupt(f, req, &d);
free(path);
}
pthread_rwlock_unlock(&f->tree_lock);
if (res >= 0) {
if (f->conf.debug)
fprintf(stderr, " READ[%llu] %u bytes\n",
(unsigned long long)fi->fh, res);
if ((size_t) res > size)
fprintf(stderr, "fuse: read too many bytes");
fuse_reply_buf(req, buf, res); //返回结果
} else
reply_err(req, res);
free(buf);
从上面的代码可以看出,fuse对fuse_operations这组操作使用的是读写锁,而不是互斥量,这样有利于提升文件系统执行效率。当读写锁是写加锁状态时,在它被解锁之前,所有试图对这个锁加锁的线程都会被阻塞。当读写锁在读加锁状态时,所有试图以读模式对它进行加锁的线程都可以获得访问权,但是如果线程希望以写模式对此锁加锁,它必须阻塞直到所有的线程释放读锁。在不同的系统上读写锁的实现可能各不相同,但当读写锁处于读模式锁住状态时,如果有另外线程试图以写模式加锁时,读写锁通常会阻塞接下来的读模式锁请求,以避免读模式锁被长期占用,导致写模式锁请求很长时间不能被满足。