[PATCH 04/16] GFS: core fs

From: David Teigland (teigland_at_redhat.com)
Date: 10/10/05

  • Next message: Greg KH: "Re: [PATCH 11/16] GFS: mount and tuning options"
    Date:	Mon, 10 Oct 2005 16:01:29 -0500
    To: linux-kernel@vger.kernel.org
    
    

    --- a/fs/gfs2/ops_dentry.c 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_dentry.c 2005-10-10 11:28:49.271790845 -0500
    @@ -0,0 +1,117 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#include <linux/sched.h>
    +#include <linux/slab.h>
    +#include <linux/spinlock.h>
    +#include <linux/completion.h>
    +#include <linux/buffer_head.h>
    +#include <linux/smp_lock.h>
    +#include <asm/semaphore.h>
    +
    +#include "gfs2.h"
    +#include "dir.h"
    +#include "glock.h"
    +#include "ops_dentry.h"
    +
    +/**
    + * gfs2_drevalidate - Check directory lookup consistency
    + * @dentry: the mapping to check
    + * @nd: lookup context handed in by the caller (not referenced here)
    + *
    + * Check to make sure the lookup necessary to arrive at this inode from its
    + * parent is still good.  The parent directory's glock is taken in the
    + * shared state and the name is searched for again; the dentry is only
    + * considered good if the directory still agrees with it (same inode number
    + * and type for a positive dentry, name still absent for a negative one).
    + *
    + * Returns: 1 if the dentry is ok, 0 if it isn't (also 0 if the check
    + * itself failed)
    + */
    +
    +static int gfs2_drevalidate(struct dentry *dentry, struct nameidata *nd)
    +{
    + /* Reference on the parent is dropped with dput() on every exit path */
    + struct dentry *parent = dget_parent(dentry);
    + struct gfs2_inode *dip = get_v2ip(parent->d_inode);
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct inode *inode;
    + struct gfs2_holder d_gh;
    + struct gfs2_inode *ip;
    + struct gfs2_inum inum;
    + unsigned int type;
    + int error;
    +
    + lock_kernel();
    +
    + atomic_inc(&sdp->sd_ops_dentry);
    +
    + inode = dentry->d_inode;
    + if (inode && is_bad_inode(inode))
    + goto invalid;
    +
    + error = gfs2_glock_nq_init(dip->i_gl, LM_ST_SHARED, 0, &d_gh);
    + if (error)
    + goto fail;
    +
    + error = gfs2_dir_search(dip, &dentry->d_name, &inum, &type);
    + switch (error) {
    + case 0:
    + /* Name exists in the directory: a negative dentry is stale */
    + if (!inode)
    + goto invalid_gunlock;
    + break;
    + case -ENOENT:
    + /* Name is gone: a negative dentry is still right, a positive one is stale */
    + if (!inode)
    + goto valid_gunlock;
    + goto invalid_gunlock;
    + default:
    + goto fail_gunlock;
    + }
    +
    + ip = get_v2ip(inode);
    +
    + /* The name now refers to a different inode */
    + if (!gfs2_inum_equal(&ip->i_num, &inum))
    + goto invalid_gunlock;
    +
    + /* Same inode but the directory entry's type disagrees with the inode mode */
    + if (IF2DT(ip->i_di.di_mode) != type) {
    + gfs2_consist_inode(dip);
    + goto fail_gunlock;
    + }
    +
    + valid_gunlock:
    + gfs2_glock_dq_uninit(&d_gh);
    +
    + valid:
    + unlock_kernel();
    + dput(parent);
    + return 1;
    +
    + invalid_gunlock:
    + gfs2_glock_dq_uninit(&d_gh);
    +
    + invalid:
    + /*
    +  * A directory that has submounts below it is reported as valid;
    +  * otherwise its cached children are pruned before it is unhashed.
    +  */
    + if (inode && S_ISDIR(inode->i_mode)) {
    + if (have_submounts(dentry))
    + goto valid;
    + shrink_dcache_parent(dentry);
    + }
    + d_drop(dentry);
    +
    + unlock_kernel();
    + dput(parent);
    + return 0;
    +
    + fail_gunlock:
    + gfs2_glock_dq_uninit(&d_gh);
    +
    + /* Error path: report "not ok" but, unlike "invalid", do not d_drop() */
    + fail:
    + unlock_kernel();
    + dput(parent);
    + return 0;
    +}
    +
    +/* Dentry operations table: only d_revalidate is provided */
    +struct dentry_operations gfs2_dops = {
    + .d_revalidate = gfs2_drevalidate,
    +};
    +
    --- a/fs/gfs2/ops_dentry.h 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_dentry.h 2005-10-10 11:28:49.277789909 -0500
    @@ -0,0 +1,15 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#ifndef __OPS_DENTRY_DOT_H__
    +#define __OPS_DENTRY_DOT_H__
    +
    +/* Dentry operations table, defined in ops_dentry.c */
    +extern struct dentry_operations gfs2_dops;
    +
    +#endif /* __OPS_DENTRY_DOT_H__ */
    --- a/fs/gfs2/ops_export.c 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_export.c 2005-10-10 11:28:49.280789442 -0500
    @@ -0,0 +1,310 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#include <linux/sched.h>
    +#include <linux/slab.h>
    +#include <linux/spinlock.h>
    +#include <linux/completion.h>
    +#include <linux/buffer_head.h>
    +#include <asm/semaphore.h>
    +
    +#include "gfs2.h"
    +#include "dir.h"
    +#include "glock.h"
    +#include "glops.h"
    +#include "inode.h"
    +#include "ops_export.h"
    +#include "rgrp.h"
    +
    +/**
    + * gfs2_decode_fh - convert a file handle back into a dentry
    + * @sb: the super block the handle belongs to
    + * @fh: the handle, an array of 32-bit little-endian words
    + * @fh_len: number of words in @fh
    + * @fh_type: handle type; must equal @fh_len and be either 4 or 8
    + * @acceptable: callback passed through to find_exported_dentry()
    + * @context: opaque argument for @acceptable
    + *
    + * Words 0-3 hold the object's no_formal_ino and no_addr (high word
    + * first).  An 8-word handle additionally carries the parent's numbers in
    + * words 4-7; for a 4-word handle the parent is left zeroed.
    + *
    + * Returns: NULL for a malformed handle, otherwise whatever
    + * gfs2_export_ops.find_exported_dentry() returns
    + */
    +
    +static struct dentry *gfs2_decode_fh(struct super_block *sb,
    +				     __u32 *fh,
    +				     int fh_len,
    +				     int fh_type,
    +				     int (*acceptable)(void *context,
    +						       struct dentry *dentry),
    +				     void *context)
    +{
    +	struct gfs2_inum this, parent;
    +
    +	atomic_inc(&get_v2sdp(sb)->sd_ops_export);
    +
    +	if (fh_type != fh_len)
    +		return NULL;
    +	if (fh_type != 4 && fh_type != 8)
    +		return NULL;
    +
    +	memset(&parent, 0, sizeof(struct gfs2_inum));
    +
    +	/* Only the long form of the handle describes the parent */
    +	if (fh_type == 8) {
    +		parent.no_formal_ino =
    +			(((uint64_t)le32_to_cpu(fh[4])) << 32) |
    +			le32_to_cpu(fh[5]);
    +		parent.no_addr =
    +			(((uint64_t)le32_to_cpu(fh[6])) << 32) |
    +			le32_to_cpu(fh[7]);
    +	}
    +
    +	this.no_formal_ino =
    +		(((uint64_t)le32_to_cpu(fh[0])) << 32) | le32_to_cpu(fh[1]);
    +	this.no_addr =
    +		(((uint64_t)le32_to_cpu(fh[2])) << 32) | le32_to_cpu(fh[3]);
    +
    +	return gfs2_export_ops.find_exported_dentry(sb, &this, &parent,
    +						    acceptable, context);
    +}
    +
    +/**
    + * gfs2_encode_fh - build a file handle for a dentry
    + * @dentry: the dentry to encode
    + * @fh: output buffer of 32-bit words
    + * @len: in: words available in @fh; out: words actually used
    + * @connectable: non-zero if the parent's numbers should be included
    + *
    + * Words 0-3 receive the inode's no_formal_ino and no_addr (high word
    + * first, little-endian).  When @connectable is set and the inode is not
    + * the root directory, words 4-7 receive the same for the parent.
    + *
    + * Returns: the handle length in words (4 or 8), or 255 if @fh is too small
    + */
    +
    +static int gfs2_encode_fh(struct dentry *dentry, __u32 *fh, int *len,
    +			  int connectable)
    +{
    +	struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    +	struct gfs2_sbd *sdp = ip->i_sbd;
    +	struct gfs2_inode *pip;
    +
    +	atomic_inc(&sdp->sd_ops_export);
    +
    +	if (*len < 4)
    +		return 255;
    +	if (connectable && *len < 8)
    +		return 255;
    +
    +	fh[0] = cpu_to_le32((__u32)(ip->i_num.no_formal_ino >> 32));
    +	fh[1] = cpu_to_le32((__u32)(ip->i_num.no_formal_ino & 0xFFFFFFFF));
    +	fh[2] = cpu_to_le32((__u32)(ip->i_num.no_addr >> 32));
    +	fh[3] = cpu_to_le32((__u32)(ip->i_num.no_addr & 0xFFFFFFFF));
    +	*len = 4;
    +
    +	if (!connectable || ip == sdp->sd_root_dir)
    +		return *len;
    +
    +	/* Pin the parent's inode while d_lock keeps d_parent stable */
    +	spin_lock(&dentry->d_lock);
    +	pip = get_v2ip(dentry->d_parent->d_inode);
    +	gfs2_inode_hold(pip);
    +	spin_unlock(&dentry->d_lock);
    +
    +	fh[4] = cpu_to_le32((__u32)(pip->i_num.no_formal_ino >> 32));
    +	fh[5] = cpu_to_le32((__u32)(pip->i_num.no_formal_ino & 0xFFFFFFFF));
    +	fh[6] = cpu_to_le32((__u32)(pip->i_num.no_addr >> 32));
    +	fh[7] = cpu_to_le32((__u32)(pip->i_num.no_addr & 0xFFFFFFFF));
    +	*len = 8;
    +
    +	gfs2_inode_put(pip);
    +
    +	return *len;
    +}
    +
    +/* Search state handed to the get_name_filldir() callback by gfs2_get_name() */
    +struct get_name_filldir {
    + struct gfs2_inum inum; /* inode number being searched for */
    + char *name; /* caller's buffer; receives the matching entry's name */
    +};
    +
    +/**
    + * get_name_filldir - directory-read callback that looks for one inode
    + * @opaque: a struct get_name_filldir describing the search
    + * @name: name of the current directory entry (not NUL terminated)
    + * @length: length of @name
    + * @offset: offset of the entry (unused)
    + * @inum: inode number of the current entry
    + * @type: type of the current entry (unused)
    + *
    + * Returns: 1 after copying the name of a matching entry into the search
    + * buffer, 0 if this entry is not the one being looked for
    + */
    +
    +static int get_name_filldir(void *opaque, const char *name, unsigned int length,
    +			    uint64_t offset, struct gfs2_inum *inum,
    +			    unsigned int type)
    +{
    +	struct get_name_filldir *search = opaque;
    +
    +	if (gfs2_inum_equal(inum, &search->inum)) {
    +		memcpy(search->name, name, length);
    +		search->name[length] = 0;
    +		return 1;
    +	}
    +
    +	return 0;
    +}
    +
    +/**
    + * gfs2_get_name - find the name under which a child appears in a directory
    + * @parent: dentry of the directory to scan
    + * @name: output buffer for the NUL-terminated name
    + * @child: dentry whose inode is being looked for
    + *
    + * Reads @parent's entries under a shared glock and copies out the name
    + * of the entry whose inode number matches @child's.
    + *
    + * Returns: 0 on success, -EINVAL for a bad @parent or @child, -ENOENT if
    + * no entry matched, or the errno from locking/reading the directory
    + */
    +
    +static int gfs2_get_name(struct dentry *parent, char *name,
    +			 struct dentry *child)
    +{
    +	struct inode *dir = parent->d_inode;
    +	struct inode *inode = child->d_inode;
    +	struct get_name_filldir gnfd;
    +	struct gfs2_inode *dip, *ip;
    +	struct gfs2_holder gh;
    +	uint64_t offset = 0;
    +	int error;
    +
    +	if (!dir)
    +		return -EINVAL;
    +
    +	atomic_inc(&get_v2sdp(dir->i_sb)->sd_ops_export);
    +
    +	if (!S_ISDIR(dir->i_mode))
    +		return -EINVAL;
    +	if (!inode)
    +		return -EINVAL;
    +
    +	dip = get_v2ip(dir);
    +	ip = get_v2ip(inode);
    +
    +	/* An empty name after the scan means "no matching entry" */
    +	*name = 0;
    +	gnfd.name = name;
    +	gnfd.inum = ip->i_num;
    +
    +	error = gfs2_glock_nq_init(dip->i_gl, LM_ST_SHARED, 0, &gh);
    +	if (error)
    +		return error;
    +
    +	error = gfs2_dir_read(dip, &offset, &gnfd, get_name_filldir);
    +	gfs2_glock_dq_uninit(&gh);
    +
    +	if (error)
    +		return error;
    +
    +	return *name ? 0 : -ENOENT;
    +}
    +
    +/**
    + * gfs2_get_parent - get a dentry for the parent of a directory
    + * @child: dentry whose ".." entry is looked up
    + *
    + * Returns: an anonymous dentry for the parent, or an ERR_PTR() (the
    + * lookup error, or -ENOMEM if no inode or dentry could be obtained)
    + */
    +
    +static struct dentry *gfs2_get_parent(struct dentry *child)
    +{
    +	struct gfs2_inode *dip = get_v2ip(child->d_inode);
    +	struct qstr dotdot = { .name = "..", .len = 2 };
    +	struct gfs2_inode *parent_ip;
    +	struct inode *parent_inode;
    +	struct dentry *result;
    +	int error;
    +
    +	atomic_inc(&dip->i_sbd->sd_ops_export);
    +
    +	error = gfs2_lookupi(dip, &dotdot, 1, &parent_ip);
    +	if (error)
    +		return ERR_PTR(error);
    +
    +	/* Swap the reference from gfs2_lookupi() for a VFS inode reference */
    +	parent_inode = gfs2_ip2v(parent_ip);
    +	gfs2_inode_put(parent_ip);
    +
    +	if (!parent_inode)
    +		return ERR_PTR(-ENOMEM);
    +
    +	result = d_alloc_anon(parent_inode);
    +	if (result)
    +		return result;
    +
    +	iput(parent_inode);
    +	return ERR_PTR(-ENOMEM);
    +}
    +
    +/**
    + * gfs2_get_dentry - get a dentry for an inode number
    + * @sb: the super block
    + * @inum_p: pointer to the struct gfs2_inum being looked up
    + *
    + * Tries gfs2_iget() first.  Failing that, the inode glock is taken and an
    + * existing in-core gfs2 inode is looked for (NO_CREATE).  If there is none,
    + * the resource group is consulted to confirm that the block really is a
    + * dinode before the inode is created and refreshed.
    + *
    + * Returns: an anonymous dentry, or an ERR_PTR(): -ESTALE if the numbers
    + * no longer match or the block is not a dinode, -EIO for a system inode,
    + * -EINVAL if no resource group covers the block, -ENOMEM, or a
    + * locking/read errno
    + */
    +
    +static struct dentry *gfs2_get_dentry(struct super_block *sb, void *inum_p)
    +{
    + struct gfs2_sbd *sdp = get_v2sdp(sb);
    + struct gfs2_inum *inum = (struct gfs2_inum *)inum_p;
    + struct gfs2_holder i_gh, ri_gh, rgd_gh;
    + struct gfs2_rgrpd *rgd;
    + struct gfs2_inode *ip;
    + struct inode *inode;
    + struct dentry *dentry;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_export);
    +
    + /* System files? */
    +
    + inode = gfs2_iget(sb, inum);
    + if (inode) {
    + ip = get_v2ip(inode);
    + /* Same block address but a different formal number: handle is stale */
    + if (ip->i_num.no_formal_ino != inum->no_formal_ino) {
    + iput(inode);
    + return ERR_PTR(-ESTALE);
    + }
    + goto out_inode;
    + }
    +
    + error = gfs2_glock_nq_num(sdp,
    + inum->no_addr, &gfs2_inode_glops,
    + LM_ST_SHARED, LM_FLAG_ANY | GL_LOCAL_EXCL,
    + &i_gh);
    + if (error)
    + return ERR_PTR(error);
    +
    + /* First look for an inode structure that already exists */
    + error = gfs2_inode_get(i_gh.gh_gl, inum, NO_CREATE, &ip);
    + if (error)
    + goto fail;
    + if (ip)
    + goto out_ip;
    +
    + error = gfs2_rindex_hold(sdp, &ri_gh);
    + if (error)
    + goto fail;
    +
    + error = -EINVAL;
    + rgd = gfs2_blk2rgrpd(sdp, inum->no_addr);
    + if (!rgd)
    + goto fail_rindex;
    +
    + error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_SHARED, 0, &rgd_gh);
    + if (error)
    + goto fail_rindex;
    +
    + /* Only go on if the block is marked as a dinode in its resource group */
    + error = -ESTALE;
    + if (gfs2_get_block_type(rgd, inum->no_addr) != GFS2_BLKST_DINODE)
    + goto fail_rgd;
    +
    + gfs2_glock_dq_uninit(&rgd_gh);
    + gfs2_glock_dq_uninit(&ri_gh);
    +
    + error = gfs2_inode_get(i_gh.gh_gl, inum, CREATE, &ip);
    + if (error)
    + goto fail;
    +
    + error = gfs2_inode_refresh(ip);
    + if (error) {
    + gfs2_inode_put(ip);
    + goto fail;
    + }
    +
    + atomic_inc(&sdp->sd_fh2dentry_misses);
    +
    + out_ip:
    + /* Inodes flagged GFS2_DIF_SYSTEM are refused */
    + error = -EIO;
    + if (ip->i_di.di_flags & GFS2_DIF_SYSTEM) {
    + gfs2_inode_put(ip);
    + goto fail;
    + }
    +
    + gfs2_glock_dq_uninit(&i_gh);
    +
    + inode = gfs2_ip2v(ip);
    + gfs2_inode_put(ip);
    +
    + if (!inode)
    + return ERR_PTR(-ENOMEM);
    +
    + out_inode:
    + dentry = d_alloc_anon(inode);
    + if (!dentry) {
    + iput(inode);
    + return ERR_PTR(-ENOMEM);
    + }
    +
    + return dentry;
    +
    + /* Error unwinding: release the holders in reverse order of acquisition */
    + fail_rgd:
    + gfs2_glock_dq_uninit(&rgd_gh);
    +
    + fail_rindex:
    + gfs2_glock_dq_uninit(&ri_gh);
    +
    + fail:
    + gfs2_glock_dq_uninit(&i_gh);
    + return ERR_PTR(error);
    +}
    +
    +/*
    + * Export operations table.  gfs2_decode_fh() also calls through this
    + * table's find_exported_dentry member, which is not initialised here.
    + */
    +struct export_operations gfs2_export_ops = {
    + .decode_fh = gfs2_decode_fh,
    + .encode_fh = gfs2_encode_fh,
    + .get_name = gfs2_get_name,
    + .get_parent = gfs2_get_parent,
    + .get_dentry = gfs2_get_dentry,
    +};
    +
    --- a/fs/gfs2/ops_export.h 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_export.h 2005-10-10 11:28:49.281789286 -0500
    @@ -0,0 +1,15 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#ifndef __OPS_EXPORT_DOT_H__
    +#define __OPS_EXPORT_DOT_H__
    +
    +/* Export operations table, defined in ops_export.c */
    +extern struct export_operations gfs2_export_ops;
    +
    +#endif /* __OPS_EXPORT_DOT_H__ */
    --- a/fs/gfs2/ops_file.c 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_file.c 2005-10-10 11:28:49.293787415 -0500
    @@ -0,0 +1,1521 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#include <linux/sched.h>
    +#include <linux/slab.h>
    +#include <linux/spinlock.h>
    +#include <linux/completion.h>
    +#include <linux/buffer_head.h>
    +#include <linux/pagemap.h>
    +#include <linux/uio.h>
    +#include <linux/blkdev.h>
    +#include <linux/mm.h>
    +#include <linux/smp_lock.h>
    +#include <linux/gfs2_ioctl.h>
    +#include <asm/semaphore.h>
    +#include <asm/uaccess.h>
    +
    +#include "gfs2.h"
    +#include "bmap.h"
    +#include "dir.h"
    +#include "glock.h"
    +#include "glops.h"
    +#include "inode.h"
    +#include "ioctl.h"
    +#include "jdata.h"
    +#include "lm.h"
    +#include "log.h"
    +#include "meta_io.h"
    +#include "ops_file.h"
    +#include "ops_vm.h"
    +#include "quota.h"
    +#include "rgrp.h"
    +#include "trans.h"
    +
    +/* "bad" is for NFS support */
    +/*
    + * One recorded directory entry.
    + * NOTE(review): field meanings are inferred from their names; the code
    + * that fills and consumes them is not in this part of the file.
    + */
    +struct filldir_bad_entry {
    + char *fbe_name;
    + unsigned int fbe_length;
    + uint64_t fbe_offset;
    + struct gfs2_inum fbe_inum;
    + unsigned int fbe_type;
    +};
    +
    +/*
    + * State for the "bad" (NFS) readdir path: an array of filldir_bad_entry
    + * plus a name buffer.
    + * NOTE(review): presumably *_num/*_size are capacities and *_off the
    + * amounts used so far -- confirm against the users of this struct.
    + */
    +struct filldir_bad {
    + struct gfs2_sbd *fdb_sbd;
    +
    + struct filldir_bad_entry *fdb_entry;
    + unsigned int fdb_entry_num;
    + unsigned int fdb_entry_off;
    +
    + char *fdb_name;
    + unsigned int fdb_name_size;
    + unsigned int fdb_name_off;
    +};
    +
    +/* For regular, non-NFS */
    +/*
    + * NOTE(review): fdr_filldir/fdr_opaque look like the caller's filldir
    + * callback and its argument -- confirm against the users of this struct.
    + */
    +struct filldir_reg {
    + struct gfs2_sbd *fdr_sbd;
    + int fdr_prefetch;
    +
    + filldir_t fdr_filldir;
    + void *fdr_opaque;
    +};
    +
    +/*
    + * Read/write worker invoked by walk_vm()/walk_vm_hard().  @ghs holds
    + * @num_gh initialised holders followed by one spare slot (index @num_gh)
    + * that the worker uses for the file's own glock.
    + */
    +typedef ssize_t(*do_rw_t) (struct file *file,
    + char *buf,
    + size_t size, loff_t *offset,
    + unsigned int num_gh, struct gfs2_holder *ghs);
    +
    +/**
    + * gfs2_llseek - seek to a location in a file
    + * @file: the file
    + * @offset: the offset
    + * @origin: Where to seek from (SEEK_SET, SEEK_CUR, or SEEK_END)
    + *
    + * Only SEEK_END (origin 2) depends on the file's size, so only that
    + * case takes the inode glock around the seek.
    + *
    + * Returns: The new offset, or errno
    + */
    +
    +static loff_t gfs2_llseek(struct file *file, loff_t offset, int origin)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_holder i_gh;
    +	loff_t ret;
    +
    +	atomic_inc(&ip->i_sbd->sd_ops_file);
    +
    +	if (origin != 2)
    +		return remote_llseek(file, offset, origin);
    +
    +	ret = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &i_gh);
    +	if (ret)
    +		return ret;
    +
    +	ret = remote_llseek(file, offset, origin);
    +	gfs2_glock_dq_uninit(&i_gh);
    +
    +	return ret;
    +}
    +
    +/*
    + * Pick the glock state for a mapping: exclusive when the vma may be both
    + * written and shared, shared otherwise.
    + */
    +static inline unsigned int vma2state(struct vm_area_struct *vma)
    +{
    +	const unsigned long shared_writable = VM_MAYWRITE | VM_MAYSHARE;
    +
    +	return ((vma->vm_flags & shared_writable) == shared_writable) ?
    +		LM_ST_EXCLUSIVE : LM_ST_SHARED;
    +}
    +
    +/**
    + * walk_vm_hard - slow path of walk_vm()
    + * @file: The file to read/write from/to
    + * @buf: The buffer to copy to/from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + * @operation: The read or write worker function
    + *
    + * Builds one holder for every vma overlapping the buffer that maps a file
    + * on this super block, plus a spare slot for the worker's own lock, and
    + * hands them to @operation.
    + *
    + * Entered from walk_vm() with mm->mmap_sem held for read (unless the task
    + * is dumping core); the semaphore is released here before @operation runs.
    + *
    + * Returns: whatever @operation returns, or -ENOMEM
    + */
    +
    +static ssize_t walk_vm_hard(struct file *file, char *buf, size_t size,
    + loff_t *offset, do_rw_t operation)
    +{
    + struct gfs2_holder *ghs;
    + unsigned int num_gh = 0;
    + ssize_t count;
    + struct super_block *sb = file->f_dentry->d_inode->i_sb;
    + struct mm_struct *mm = current->mm;
    + struct vm_area_struct *vma;
    + unsigned long start = (unsigned long)buf;
    + unsigned long end = start + size;
    + int dumping = (current->flags & PF_DUMPCORE);
    + unsigned int x = 0;
    +
    + /* Pass 1: count the vmas that need a holder */
    + for (vma = find_vma(mm, start); vma; vma = vma->vm_next) {
    + if (end <= vma->vm_start)
    + break;
    + if (vma->vm_file &&
    + vma->vm_file->f_dentry->d_inode->i_sb == sb) {
    + num_gh++;
    + }
    + }
    +
    + /* One extra slot for the holder the worker sets up at ghs[num_gh] */
    + ghs = kcalloc((num_gh + 1), sizeof(struct gfs2_holder), GFP_KERNEL);
    + if (!ghs) {
    + if (!dumping)
    + up_read(&mm->mmap_sem);
    + return -ENOMEM;
    + }
    +
    + /* Pass 2: initialise a holder for each vma counted above */
    + for (vma = find_vma(mm, start); vma; vma = vma->vm_next) {
    + if (end <= vma->vm_start)
    + break;
    + if (vma->vm_file) {
    + struct inode *inode = vma->vm_file->f_dentry->d_inode;
    + if (inode->i_sb == sb)
    + gfs2_holder_init(get_v2ip(inode)->i_gl,
    + vma2state(vma), 0, &ghs[x++]);
    + }
    + }
    +
    + if (!dumping)
    + up_read(&mm->mmap_sem);
    +
    + /* Both passes ran under the same mmap_sem hold, so they must agree */
    + gfs2_assert(get_v2sdp(sb), x == num_gh);
    +
    + count = operation(file, buf, size, offset, num_gh, ghs);
    +
    + while (num_gh--)
    + gfs2_holder_uninit(&ghs[num_gh]);
    + kfree(ghs);
    +
    + return count;
    +}
    +
    +/**
    + * walk_vm - Walk the vmas associated with a buffer for read or write.
    + * If any of them are gfs2, pass the gfs2 inode down to the read/write
    + * worker function so that locks can be acquired in the correct order.
    + * @file: The file to read/write from/to
    + * @buf: The buffer to copy to/from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + * @operation: The read or write worker function
    + *
    + * If no vma overlapping the buffer maps a file on this super block, the
    + * worker is called directly with no extra holders and a single on-stack
    + * holder for its own lock.  Otherwise walk_vm_hard() takes over.
    + *
    + * Outputs: Offset - updated according to number of bytes written
    + *
    + * Returns: The number of bytes written, errno on failure
    + */
    +
    +static ssize_t walk_vm(struct file *file, char *buf, size_t size,
    +		       loff_t *offset, do_rw_t operation)
    +{
    +	struct gfs2_holder gh;
    +	struct mm_struct *mm = current->mm;
    +
    +	if (mm) {
    +		struct super_block *sb = file->f_dentry->d_inode->i_sb;
    +		unsigned long start = (unsigned long)buf;
    +		unsigned long end = start + size;
    +		int dumping = (current->flags & PF_DUMPCORE);
    +		struct vm_area_struct *vma;
    +
    +		if (!dumping)
    +			down_read(&mm->mmap_sem);
    +
    +		vma = find_vma(mm, start);
    +		while (vma && end > vma->vm_start) {
    +			/*
    +			 * Found a mapping of a file on this fs: take the
    +			 * slow path, which drops mmap_sem itself.
    +			 */
    +			if (vma->vm_file &&
    +			    vma->vm_file->f_dentry->d_inode->i_sb == sb)
    +				return walk_vm_hard(file, buf, size, offset,
    +						    operation);
    +			vma = vma->vm_next;
    +		}
    +
    +		if (!dumping)
    +			up_read(&mm->mmap_sem);
    +	}
    +
    +	return operation(file, buf, size, offset, 0, &gh);
    +}
    +
    +/**
    + * do_jdata_read - read from a file through gfs2_jdata_read()
    + * @file: The file to read from
    + * @buf: The user buffer to copy into
    + * @size: The amount of data requested
    + * @offset: The current file offset; advanced by the bytes read
    + *
    + * Without O_LARGEFILE the read is clamped so it ends at MAX_NON_LFS.
    + *
    + * Returns: The number of bytes read, errno on failure
    + */
    +
    +static ssize_t do_jdata_read(struct file *file, char *buf, size_t size,
    +			     loff_t *offset)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	ssize_t nread;
    +
    +	if (*offset < 0)
    +		return -EINVAL;
    +
    +	if (!access_ok(VERIFY_WRITE, buf, size))
    +		return -EFAULT;
    +
    +	if (!(file->f_flags & O_LARGEFILE)) {
    +		if (*offset >= MAX_NON_LFS)
    +			return -EFBIG;
    +
    +		if (*offset + size > MAX_NON_LFS)
    +			size = MAX_NON_LFS - *offset;
    +	}
    +
    +	nread = gfs2_jdata_read(ip, buf, *offset, size, gfs2_copy2user);
    +	if (nread > 0)
    +		*offset += nread;
    +
    +	return nread;
    +}
    +
    +/**
    + * do_read_direct - Read bytes from a file
    + * @file: The file to read from
    + * @buf: The buffer to copy into
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + * @num_gh: The number of other locks we need to do the read
    + * @ghs: the locks we need plus one for our lock
    + *
    + * Worker for O_DIRECT reads (see gfs2_read()).  Files with the jdata
    + * attribute are refused with -EINVAL.
    + *
    + * Outputs: Offset - updated according to number of bytes read
    + *
    + * Returns: The number of bytes read, errno on failure
    + */
    +
    +static ssize_t do_read_direct(struct file *file, char *buf, size_t size,
    + loff_t *offset, unsigned int num_gh,
    + struct gfs2_holder *ghs)
    +{
    + struct inode *inode = file->f_mapping->host;
    + struct gfs2_inode *ip = get_v2ip(inode);
    + unsigned int state = LM_ST_DEFERRED;
    + int flags = 0;
    + unsigned int x;
    + ssize_t count = 0;
    + int error;
    +
    + /*
    +  * If one of the other holders is already on this file's glock, ask
    +  * for SHARED with GL_LOCAL_EXCL instead of the default DEFERRED.
    +  */
    + for (x = 0; x < num_gh; x++)
    + if (ghs[x].gh_gl == ip->i_gl) {
    + state = LM_ST_SHARED;
    + flags |= GL_LOCAL_EXCL;
    + break;
    + }
    +
    + /* Our own holder goes in the spare slot after the other locks */
    + gfs2_holder_init(ip->i_gl, state, flags, &ghs[num_gh]);
    +
    + error = gfs2_glock_nq_m(num_gh + 1, ghs);
    + if (error)
    + goto out;
    +
    + error = -EINVAL;
    + if (gfs2_is_jdata(ip))
    + goto out_gunlock;
    +
    + if (gfs2_is_stuffed(ip)) {
    + size_t mask = bdev_hardsect_size(inode->i_sb->s_bdev) - 1;
    +
    + /* Offset and buffer address must be sector aligned (-EINVAL if not) */
    + if (((*offset) & mask) || (((unsigned long)buf) & mask))
    + goto out_gunlock;
    +
    + /* Size is rounded down to a whole number of sectors */
    + count = do_jdata_read(file, buf, size & ~mask, offset);
    + } else
    + count = generic_file_read(file, buf, size, offset);
    +
    + error = 0;
    +
    + out_gunlock:
    + gfs2_glock_dq_m(num_gh + 1, ghs);
    +
    + out:
    + gfs2_holder_uninit(&ghs[num_gh]);
    +
    + /* A non-zero count (bytes read or the read's own errno) wins over error */
    + return (count) ? count : error;
    +}
    +
    +/**
    + * do_read_buf - Read bytes from a file
    + * @file: The file to read from
    + * @buf: The buffer to copy into
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + * @num_gh: The number of other locks we need to do the read
    + * @ghs: the locks we need plus one for our lock
    + *
    + * Worker for buffered reads.  Jdata files, and stuffed files that have
    + * not been flagged GIF_PAGED, go through do_jdata_read(); everything
    + * else uses generic_file_read().
    + *
    + * Outputs: Offset - updated according to number of bytes read
    + *
    + * Returns: The number of bytes read, errno on failure
    + */
    +
    +static ssize_t do_read_buf(struct file *file, char *buf, size_t size,
    +			   loff_t *offset, unsigned int num_gh,
    +			   struct gfs2_holder *ghs)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_holder *own_gh = &ghs[num_gh];
    +	ssize_t count = 0;
    +	int error;
    +
    +	gfs2_holder_init(ip->i_gl, LM_ST_SHARED, GL_ATIME, own_gh);
    +
    +	error = gfs2_glock_nq_m_atime(num_gh + 1, ghs);
    +	if (!error) {
    +		int via_jdata = gfs2_is_jdata(ip);
    +
    +		if (!via_jdata)
    +			via_jdata = gfs2_is_stuffed(ip) &&
    +				    !test_bit(GIF_PAGED, &ip->i_flags);
    +
    +		if (via_jdata)
    +			count = do_jdata_read(file, buf, size, offset);
    +		else
    +			count = generic_file_read(file, buf, size, offset);
    +
    +		gfs2_glock_dq_m(num_gh + 1, ghs);
    +	}
    +
    +	gfs2_holder_uninit(own_gh);
    +
    +	if (count)
    +		return count;
    +	return error;
    +}
    +
    +/**
    + * gfs2_read - Read bytes from a file
    + * @file: The file to read from
    + * @buf: The buffer to copy into
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + *
    + * Dispatches to the direct or buffered worker depending on O_DIRECT.
    + *
    + * Outputs: Offset - updated according to number of bytes read
    + *
    + * Returns: The number of bytes read, errno on failure
    + */
    +
    +static ssize_t gfs2_read(struct file *file, char *buf, size_t size,
    +			 loff_t *offset)
    +{
    +	do_rw_t worker;
    +
    +	atomic_inc(&get_v2sdp(file->f_mapping->host->i_sb)->sd_ops_file);
    +
    +	worker = (file->f_flags & O_DIRECT) ? do_read_direct : do_read_buf;
    +
    +	return walk_vm(file, buf, size, offset, worker);
    +}
    +
    +/**
    + * grope_mapping - touch every page of a buffer that is about to be written
    + * @buf: the start of the memory to be written
    + * @size: the size of the memory to be written
    + *
    + * Reads one byte from each page of the user buffer.  We do this after
    + * acquiring the locks on the mapping, but before starting the write
    + * transaction. We need to make sure that we don't cause recursive
    + * transactions if blocks need to be allocated to the file backing the
    + * mapping.
    + *
    + * Returns: errno
    + */
    +
    +static int grope_mapping(char *buf, size_t size)
    +{
    +	unsigned long addr = (unsigned long)buf;
    +	const unsigned long limit = addr + size;
    +	char probe;
    +
    +	/* After the first probe, step to the start of each following page */
    +	for (; addr < limit;
    +	     addr = (addr + PAGE_CACHE_SIZE) & PAGE_CACHE_MASK)
    +		if (copy_from_user(&probe, (char *)addr, 1))
    +			return -EFAULT;
    +
    +	return 0;
    +}
    +
    +/**
    + * do_write_direct_alloc - Write bytes to a file
    + * @file: The file to write to
    + * @buf: The buffer to copy from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + *
    + * One allocating chunk of a direct write: takes the quota lock, reserves
    + * blocks, and performs the write plus the dinode update inside a single
    + * transaction.  Called by do_write_direct(), which already holds the
    + * inode glock.
    + *
    + * Outputs: Offset - updated according to number of bytes written
    + *
    + * Returns: The number of bytes written, errno on failure
    + */
    +
    +static ssize_t do_write_direct_alloc(struct file *file, char *buf, size_t size,
    + loff_t *offset)
    +{
    + struct inode *inode = file->f_mapping->host;
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_sbd *sdp = ip->i_sbd;
    + struct gfs2_alloc *al = NULL;
    + struct iovec local_iov = { .iov_base = buf, .iov_len = size };
    + struct buffer_head *dibh;
    + unsigned int data_blocks, ind_blocks;
    + ssize_t count;
    + int error;
    +
    + gfs2_write_calc_reserv(ip, size, &data_blocks, &ind_blocks);
    +
    + al = gfs2_alloc_get(ip);
    +
    + error = gfs2_quota_lock(ip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE);
    + if (error)
    + goto fail;
    +
    + error = gfs2_quota_check(ip, ip->i_di.di_uid, ip->i_di.di_gid);
    + if (error)
    + goto fail_gunlock_q;
    +
    + al->al_requested = data_blocks + ind_blocks;
    +
    + error = gfs2_inplace_reserve(ip);
    + if (error)
    + goto fail_gunlock_q;
    +
    + error = gfs2_trans_begin(sdp,
    + al->al_rgd->rd_ri.ri_length + ind_blocks +
    + RES_DINODE + RES_STATFS + RES_QUOTA, 0);
    + if (error)
    + goto fail_ipres;
    +
    + /*
    +  * Writer lacks CAP_FSETID: clear setuid, and clear setgid as well
    +  * when the group-execute bit is set.
    +  */
    + if ((ip->i_di.di_mode & (S_ISUID | S_ISGID)) && !capable(CAP_FSETID)) {
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    + if (error)
    + goto fail_end_trans;
    +
    + ip->i_di.di_mode &= (ip->i_di.di_mode & S_IXGRP) ?
    + (~(S_ISUID | S_ISGID)) : (~S_ISUID);
    +
    + gfs2_trans_add_bh(ip->i_gl, dibh);
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    + }
    +
    + /* A stuffed file is unstuffed before the write is issued */
    + if (gfs2_is_stuffed(ip)) {
    + error = gfs2_unstuff_dinode(ip, gfs2_unstuffer_sync, NULL);
    + if (error)
    + goto fail_end_trans;
    + }
    +
    + count = generic_file_write_nolock(file, &local_iov, 1, offset);
    + if (count < 0) {
    + error = count;
    + goto fail_end_trans;
    + }
    +
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    + if (error)
    + goto fail_end_trans;
    +
    + /* Grow the on-disk size to the VFS inode size if needed; stamp the times */
    + if (ip->i_di.di_size < inode->i_size)
    + ip->i_di.di_size = inode->i_size;
    + ip->i_di.di_mtime = ip->i_di.di_ctime = get_seconds();
    +
    + gfs2_trans_add_bh(ip->i_gl, dibh);
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    +
    + gfs2_trans_end(sdp);
    +
    + if (file->f_flags & O_SYNC)
    + gfs2_log_flush_glock(ip->i_gl);
    +
    + gfs2_inplace_release(ip);
    + gfs2_quota_unlock(ip);
    + gfs2_alloc_put(ip);
    +
    + return count;
    +
    + /* Error unwinding: undo the steps above in reverse order */
    + fail_end_trans:
    + gfs2_trans_end(sdp);
    +
    + fail_ipres:
    + gfs2_inplace_release(ip);
    +
    + fail_gunlock_q:
    + gfs2_quota_unlock(ip);
    +
    + fail:
    + gfs2_alloc_put(ip);
    +
    + return error;
    +}
    +
    +/**
    + * do_write_direct - Write bytes to a file
    + * @file: The file to write to
    + * @buf: The buffer to copy from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + * @num_gh: The number of other locks we need to do the write
    + * @ghs: the locks we need plus one for our lock
    + *
    + * Worker for O_DIRECT writes.  The inode glock is first taken DEFERRED
    + * unless an allocating write is expected (the previous direct write on
    + * this file allocated, or one of the other holders is on the same glock).
    + * If the write turns out to need allocation while only DEFERRED is held,
    + * all locks are dropped and reacquired with the inode glock EXCLUSIVE.
    + *
    + * Files with the jdata attribute are refused with -EINVAL.
    + *
    + * Outputs: Offset - updated according to number of bytes written
    + *
    + * Returns: The number of bytes written, errno on failure
    + */
    +
    +static ssize_t do_write_direct(struct file *file, char *buf, size_t size,
    +			       loff_t *offset, unsigned int num_gh,
    +			       struct gfs2_holder *ghs)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_sbd *sdp = ip->i_sbd;
    +	struct gfs2_file *fp = get_v2fp(file);
    +	unsigned int state = LM_ST_DEFERRED;
    +	int alloc_required;
    +	unsigned int x;
    +	size_t s;
    +	ssize_t count = 0;
    +	int error;
    +
    +	if (test_bit(GFF_DID_DIRECT_ALLOC, &fp->f_flags))
    +		state = LM_ST_EXCLUSIVE;
    +	else
    +		for (x = 0; x < num_gh; x++)
    +			if (ghs[x].gh_gl == ip->i_gl) {
    +				state = LM_ST_EXCLUSIVE;
    +				break;
    +			}
    +
    + restart:
    +	/* Our own holder goes in the spare slot after the other locks */
    +	gfs2_holder_init(ip->i_gl, state, 0, &ghs[num_gh]);
    +
    +	error = gfs2_glock_nq_m(num_gh + 1, ghs);
    +	if (error)
    +		goto out;
    +
    +	error = -EINVAL;
    +	if (gfs2_is_jdata(ip))
    +		goto out_gunlock;
    +
    +	/* Touch the source buffer's pages before any transaction starts */
    +	if (num_gh) {
    +		error = grope_mapping(buf, size);
    +		if (error)
    +			goto out_gunlock;
    +	}
    +
    +	if (file->f_flags & O_APPEND)
    +		*offset = ip->i_di.di_size;
    +
    +	if (!(file->f_flags & O_LARGEFILE)) {
    +		error = -EFBIG;
    +		if (*offset >= MAX_NON_LFS)
    +			goto out_gunlock;
    +		if (*offset + size > MAX_NON_LFS)
    +			size = MAX_NON_LFS - *offset;
    +	}
    +
    +	/*
    +	 * Stuffed files, writes past the current size and writes that must
    +	 * clear setuid/setgid all take the allocating path.
    +	 */
    +	if (gfs2_is_stuffed(ip) ||
    +	    *offset + size > ip->i_di.di_size ||
    +	    ((ip->i_di.di_mode & (S_ISUID | S_ISGID)) && !capable(CAP_FSETID)))
    +		alloc_required = 1;
    +	else {
    +		error = gfs2_write_alloc_required(ip, *offset, size,
    +						  &alloc_required);
    +		if (error)
    +			goto out_gunlock;
    +	}
    +
    +	/* Allocation needs the glock EXCLUSIVE: drop everything and retry */
    +	if (alloc_required && state != LM_ST_EXCLUSIVE) {
    +		gfs2_glock_dq_m(num_gh + 1, ghs);
    +		gfs2_holder_uninit(&ghs[num_gh]);
    +		state = LM_ST_EXCLUSIVE;
    +		goto restart;
    +	}
    +
    +	if (alloc_required) {
    +		set_bit(GFF_DID_DIRECT_ALLOC, &fp->f_flags);
    +
    +		/* split large writes into smaller atomic transactions */
    +		while (size) {
    +			s = gfs2_tune_get(sdp, gt_max_atomic_write);
    +			if (s > size)
    +				s = size;
    +
    +			error = do_write_direct_alloc(file, buf, s, offset);
    +			if (error < 0)
    +				goto out_gunlock;
    +
    +			/*
    +			 * No progress (nothing written, or a zero chunk
    +			 * size): stop instead of spinning forever with
    +			 * the glock held.
    +			 */
    +			if (!error)
    +				break;
    +
    +			buf += error;
    +			size -= error;
    +			count += error;
    +		}
    +	} else {
    +		struct iovec local_iov = { .iov_base = buf, .iov_len = size };
    +		struct gfs2_holder t_gh;
    +
    +		clear_bit(GFF_DID_DIRECT_ALLOC, &fp->f_flags);
    +
    +		/* Hold the transaction glock shared across the in-place write */
    +		error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_SHARED,
    +					   GL_NEVER_RECURSE, &t_gh);
    +		if (error)
    +			goto out_gunlock;
    +
    +		count = generic_file_write_nolock(file, &local_iov, 1, offset);
    +
    +		gfs2_glock_dq_uninit(&t_gh);
    +	}
    +
    +	error = 0;
    +
    + out_gunlock:
    +	gfs2_glock_dq_m(num_gh + 1, ghs);
    +
    + out:
    +	gfs2_holder_uninit(&ghs[num_gh]);
    +
    +	/* Bytes already written take precedence over a later error */
    +	return (count) ? count : error;
    +}
    +
    +/**
    + * do_do_write_buf - Write bytes to a file
    + * @file: The file to write to
    + * @buf: The buffer to copy from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + *
    + * Performs one buffered write inside a single transaction.
    + *
    + * When gfs2_write_alloc_required() reports that blocks must be allocated,
    + * the quota lock is taken, the quota is checked and an in-place
    + * reservation for data_blocks + ind_blocks is made before the transaction
    + * is begun; the reservation, quota lock and allocation structure are
    + * released again on both the success path and the failure paths.
    + *
    + * If the inode has S_ISUID or S_ISGID set and the caller lacks
    + * CAP_FSETID, S_ISUID is cleared (and S_ISGID too when S_IXGRP is set)
    + * and the dinode is written out as part of the transaction.
    + *
    + * Journaled files, and stuffed files that are not flagged GIF_PAGED and
    + * whose write ends within sb_bsize - sizeof(struct gfs2_dinode), are
    + * written with gfs2_jdata_write().  Everything else goes through
    + * generic_file_write_nolock(), after which di_size is raised to i_size
    + * if needed and di_mtime/di_ctime are set to the current time.
    + *
    + * Outputs: Offset - updated according to number of bytes written
    + *
    + * Returns: The number of bytes written, errno on failure
    + */
    +
    +static ssize_t do_do_write_buf(struct file *file, char *buf, size_t size,
    + loff_t *offset)
    +{
    + struct inode *inode = file->f_mapping->host;
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_sbd *sdp = ip->i_sbd;
    + struct gfs2_alloc *al = NULL;
    + struct buffer_head *dibh;
    + unsigned int data_blocks, ind_blocks;
    + int alloc_required, journaled;
    + ssize_t count;
    + int error;
    +
    + journaled = gfs2_is_jdata(ip);
    +
    + gfs2_write_calc_reserv(ip, size, &data_blocks, &ind_blocks);
    +
    + error = gfs2_write_alloc_required(ip, *offset, size, &alloc_required);
    + if (error)
    + return error;
    +
    + if (alloc_required) {
    + al = gfs2_alloc_get(ip);
    +
    + error = gfs2_quota_lock(ip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE);
    + if (error)
    + goto fail;
    +
    + error = gfs2_quota_check(ip, ip->i_di.di_uid, ip->i_di.di_gid);
    + if (error)
    + goto fail_gunlock_q;
    +
    + al->al_requested = data_blocks + ind_blocks;
    +
    + error = gfs2_inplace_reserve(ip);
    + if (error)
    + goto fail_gunlock_q;
    +
    + error = gfs2_trans_begin(sdp,
    + al->al_rgd->rd_ri.ri_length +
    + ind_blocks +
    + ((journaled) ? data_blocks : 0) +
    + RES_DINODE + RES_STATFS + RES_QUOTA,
    + 0);
    + if (error)
    + goto fail_ipres;
    + } else {
    + error = gfs2_trans_begin(sdp,
    + ((journaled) ? data_blocks : 0) +
    + RES_DINODE,
    + 0);
    + if (error)
    + goto fail_ipres; /* alloc_required is 0 here, so the unwind below releases nothing */
    + }
    +
    + if ((ip->i_di.di_mode & (S_ISUID | S_ISGID)) && !capable(CAP_FSETID)) {
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    + if (error)
    + goto fail_end_trans;
    +
    + ip->i_di.di_mode &= (ip->i_di.di_mode & S_IXGRP) ?
    + (~(S_ISUID | S_ISGID)) : (~S_ISUID);
    +
    + gfs2_trans_add_bh(ip->i_gl, dibh);
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    + }
    +
    + if (journaled ||
    + (gfs2_is_stuffed(ip) && !test_bit(GIF_PAGED, &ip->i_flags) &&
    + *offset + size <= sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode))) {
    +
    + count = gfs2_jdata_write(ip, buf, *offset, size,
    + gfs2_copy_from_user);
    + if (count < 0) {
    + error = count;
    + goto fail_end_trans;
    + }
    +
    + *offset += count; /* this path advances the offset itself */
    + } else {
    + struct iovec local_iov = { .iov_base = buf, .iov_len = size };
    +
    + count = generic_file_write_nolock(file, &local_iov, 1, offset);
    + if (count < 0) {
    + error = count;
    + goto fail_end_trans;
    + }
    +
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    + if (error)
    + goto fail_end_trans;
    +
    + if (ip->i_di.di_size < inode->i_size)
    + ip->i_di.di_size = inode->i_size;
    + ip->i_di.di_mtime = ip->i_di.di_ctime = get_seconds();
    +
    + gfs2_trans_add_bh(ip->i_gl, dibh);
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    + }
    +
    + gfs2_trans_end(sdp);
    +
    + if (file->f_flags & O_SYNC)
    + gfs2_log_flush_glock(ip->i_gl);
    +
    + if (alloc_required) {
    + gfs2_assert_warn(sdp, count != size ||
    + al->al_alloced); /* warns when a full-size write allocated nothing */
    + gfs2_inplace_release(ip);
    + gfs2_quota_unlock(ip);
    + gfs2_alloc_put(ip);
    + }
    +
    + return count;
    +
    + fail_end_trans:
    + gfs2_trans_end(sdp);
    +
    + fail_ipres:
    + if (alloc_required)
    + gfs2_inplace_release(ip);
    +
    + fail_gunlock_q:
    + if (alloc_required)
    + gfs2_quota_unlock(ip);
    +
    + fail:
    + if (alloc_required)
    + gfs2_alloc_put(ip);
    +
    + return error;
    +}
    +
    +/**
    + * do_write_buf - Buffered write of a caller-supplied buffer to a file
    + * @file: The file to write to
    + * @buf: The buffer to copy from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + * @num_gh: The number of holders in @ghs that precede the one set up here
    + * @ghs: The holder array; entry @num_gh is initialised here for the
    + *       inode glock (exclusive) and all @num_gh + 1 entries are enqueued
    + *
    + * With the glocks held, the request is honoured for O_APPEND, clamped to
    + * MAX_NON_LFS for files opened without O_LARGEFILE, and then carried out
    + * in pieces of at most gt_max_atomic_write bytes, each piece being one
    + * call to do_do_write_buf().
    + *
    + * Outputs: Offset - updated according to number of bytes written
    + *
    + * Returns: The number of bytes written if any were written, otherwise 0
    + *          or errno on failure
    + */
    +
    +static ssize_t do_write_buf(struct file *file, char *buf, size_t size,
    +			    loff_t *offset, unsigned int num_gh,
    +			    struct gfs2_holder *ghs)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_sbd *sdp = ip->i_sbd;
    +	struct gfs2_holder *i_gh = &ghs[num_gh];
    +	ssize_t written = 0;
    +	size_t chunk;
    +	int error;
    +
    +	gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, i_gh);
    +
    +	error = gfs2_glock_nq_m(num_gh + 1, ghs);
    +	if (error)
    +		goto out;
    +
    +	if (num_gh) {
    +		error = grope_mapping(buf, size);
    +		if (error)
    +			goto out_gunlock;
    +	}
    +
    +	if (file->f_flags & O_APPEND)
    +		*offset = ip->i_di.di_size;
    +
    +	if (!(file->f_flags & O_LARGEFILE)) {
    +		if (*offset >= MAX_NON_LFS) {
    +			error = -EFBIG;
    +			goto out_gunlock;
    +		}
    +		if (*offset + size > MAX_NON_LFS)
    +			size = MAX_NON_LFS - *offset;
    +	}
    +
    +	/* one transaction per piece keeps each transaction bounded */
    +	while (size) {
    +		chunk = gfs2_tune_get(sdp, gt_max_atomic_write);
    +		if (chunk > size)
    +			chunk = size;
    +
    +		error = do_do_write_buf(file, buf, chunk, offset);
    +		if (error < 0)
    +			goto out_gunlock;
    +
    +		written += error;
    +		buf += error;
    +		size -= error;
    +	}
    +
    +	error = 0;
    +
    + out_gunlock:
    +	gfs2_glock_dq_m(num_gh + 1, ghs);
    +
    + out:
    +	gfs2_holder_uninit(i_gh);
    +
    +	/* a partial write wins over a later error */
    +	if (written)
    +		return written;
    +	return error;
    +}
    +
    +/**
    + * gfs2_write - Write bytes to a file
    + * @file: The file to write to
    + * @buf: The buffer to copy from
    + * @size: The amount of data requested
    + * @offset: The current file offset
    + *
    + * Rejects a negative offset and a buffer that fails access_ok(), then,
    + * holding the inode semaphore, passes the request to walk_vm() with
    + * do_write_direct() for O_DIRECT files and do_write_buf() otherwise.
    + *
    + * Outputs: Offset - updated according to number of bytes written
    + *
    + * Returns: The number of bytes written, errno on failure
    + */
    +
    +static ssize_t gfs2_write(struct file *file, const char *buf, size_t size,
    +			  loff_t *offset)
    +{
    +	struct inode *inode = file->f_mapping->host;
    +	ssize_t written;
    +
    +	atomic_inc(&get_v2sdp(inode->i_sb)->sd_ops_file);
    +
    +	if (*offset < 0)
    +		return -EINVAL;
    +	if (!access_ok(VERIFY_READ, buf, size))
    +		return -EFAULT;
    +
    +	down(&inode->i_sem);
    +	written = walk_vm(file, (char *)buf, size, offset,
    +			  (file->f_flags & O_DIRECT) ?
    +			  do_write_direct : do_write_buf);
    +	up(&inode->i_sem);
    +
    +	return written;
    +}
    +
    +/**
    + * filldir_reg_func - Report a directory entry to the caller of gfs2_dir_read()
    + * @opaque: a struct filldir_reg describing the real filldir callback
    + * @name: the name of the directory entry
    + * @length: the length of the name
    + * @offset: the entry's offset in the directory
    + * @inum: the inode number the entry points to
    + * @type: the type of inode the entry points to
    + *
    + * Forwards the entry to fdr_filldir and, when fdr_prefetch is set and the
    + * entry is not ".", requests prefetches of the entry's inode and iopen
    + * glocks.
    + *
    + * Returns: 0 on success, 1 if buffer full
    + */
    +
    +static int filldir_reg_func(void *opaque, const char *name, unsigned int length,
    +			    uint64_t offset, struct gfs2_inum *inum,
    +			    unsigned int type)
    +{
    +	struct filldir_reg *fdr = (struct filldir_reg *)opaque;
    +	struct gfs2_sbd *sdp = fdr->fdr_sbd;
    +
    +	/* any non-zero result from the callback is reported as "full" */
    +	if (fdr->fdr_filldir(fdr->fdr_opaque, name, length, offset,
    +			     inum->no_formal_ino, type))
    +		return 1;
    +
    +	if (!fdr->fdr_prefetch)
    +		return 0;
    +
    +	if (length == 1 && *name == '.')
    +		return 0;
    +
    +	gfs2_glock_prefetch_num(sdp,
    +				inum->no_addr, &gfs2_inode_glops,
    +				LM_ST_SHARED, LM_FLAG_TRY | LM_FLAG_ANY);
    +	gfs2_glock_prefetch_num(sdp,
    +				inum->no_addr, &gfs2_iopen_glops,
    +				LM_ST_SHARED, LM_FLAG_TRY);
    +
    +	return 0;
    +}
    +
    +/**
    + * readdir_reg - Read directory entries from a directory
    + * @file: The directory to read from
    + * @dirent: Buffer for dirents
    + * @filldir: Function used to do the copying
    + *
    + * Calls @filldir (via filldir_reg_func(), with prefetching enabled) while
    + * the directory glock is held shared, then stores the resulting position
    + * back into f_pos.
    + *
    + * Returns: errno
    + */
    +
    +static int readdir_reg(struct file *file, void *dirent, filldir_t filldir)
    +{
    +	struct gfs2_inode *dip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_holder d_gh;
    +	struct filldir_reg fdr;
    +	uint64_t pos = file->f_pos;
    +	int error;
    +
    +	fdr.fdr_opaque = dirent;
    +	fdr.fdr_filldir = filldir;
    +	fdr.fdr_prefetch = 1;
    +	fdr.fdr_sbd = dip->i_sbd;
    +
    +	gfs2_holder_init(dip->i_gl, LM_ST_SHARED, GL_ATIME, &d_gh);
    +	error = gfs2_glock_nq_atime(&d_gh);
    +	if (error) {
    +		gfs2_holder_uninit(&d_gh);
    +		return error;
    +	}
    +
    +	error = gfs2_dir_read(dip, &pos, &fdr, filldir_reg_func);
    +
    +	gfs2_glock_dq_uninit(&d_gh);
    +
    +	/* f_pos is updated whether or not gfs2_dir_read() succeeded */
    +	file->f_pos = pos;
    +
    +	return error;
    +}
    +
    +/**
    + * filldir_bad_func - Report a directory entry to the caller of gfs2_dir_read()
    + * @opaque: a struct filldir_bad that collects the entries
    + * @name: the name of the directory entry
    + * @length: the length of the name
    + * @offset: the entry's offset in the directory
    + * @inum: the inode number the entry points to
    + * @type: the type of inode the entry points to
    + *
    + * For supporting NFS.
    + *
    + * Copies the entry into the next free slot of the collection buffer (the
    + * name is stored with its length, without a terminator) and, unless the
    + * entry is ".", requests prefetches of its inode and iopen glocks.
    + *
    + * Returns: 0 on success, 1 if buffer full
    + */
    +
    +static int filldir_bad_func(void *opaque, const char *name, unsigned int length,
    +			    uint64_t offset, struct gfs2_inum *inum,
    +			    unsigned int type)
    +{
    +	struct filldir_bad *fdb = (struct filldir_bad *)opaque;
    +	struct gfs2_sbd *sdp = fdb->fdb_sbd;
    +	struct filldir_bad_entry *slot;
    +
    +	/* out of entry slots */
    +	if (fdb->fdb_entry_off == fdb->fdb_entry_num)
    +		return 1;
    +	/* out of name space */
    +	if (fdb->fdb_name_off + length > fdb->fdb_name_size)
    +		return 1;
    +
    +	slot = &fdb->fdb_entry[fdb->fdb_entry_off];
    +
    +	slot->fbe_name = fdb->fdb_name + fdb->fdb_name_off;
    +	memcpy(slot->fbe_name, name, length);
    +	slot->fbe_length = length;
    +	slot->fbe_offset = offset;
    +	slot->fbe_inum = *inum;
    +	slot->fbe_type = type;
    +
    +	fdb->fdb_name_off += length;
    +	fdb->fdb_entry_off++;
    +
    +	if (length == 1 && *name == '.')
    +		return 0;
    +
    +	gfs2_glock_prefetch_num(sdp,
    +				inum->no_addr, &gfs2_inode_glops,
    +				LM_ST_SHARED, LM_FLAG_TRY | LM_FLAG_ANY);
    +	gfs2_glock_prefetch_num(sdp,
    +				inum->no_addr, &gfs2_iopen_glops,
    +				LM_ST_SHARED, LM_FLAG_TRY);
    +
    +	return 0;
    +}
    +
    +/**
    + * readdir_bad - Read directory entries from a directory
    + * @file: The directory to read from
    + * @dirent: Buffer for dirents
    + * @filldir: Function used to do the copying
    + *
    + * For supporting NFS.
    + *
    + * Unlike readdir_reg(), @filldir is not called while the directory glock
    + * is held.  Up to gt_entries_per_readdir entries are first collected by
    + * filldir_bad_func() into a single buffer allocated here (header, entry
    + * array and name area, in that order); after the glock has been dropped
    + * they are replayed to @filldir through filldir_reg_func() with
    + * prefetching disabled.
    + *
    + * If @filldir stops the replay early, f_pos is set to the offset of the
    + * entry that was refused and 0 is returned; otherwise f_pos is set to
    + * the position reported by gfs2_dir_read().
    + *
    + * NOTE(review): when at least one entry was collected, the return value
    + * of gfs2_dir_read() is overwritten by the replay loop -- confirm that
    + * dropping that error is intended.
    + *
    + * Returns: errno
    + */
    +
    +static int readdir_bad(struct file *file, void *dirent, filldir_t filldir)
    +{
    + struct gfs2_inode *dip = get_v2ip(file->f_mapping->host);
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct filldir_reg fdr;
    + unsigned int entries, size;
    + struct filldir_bad *fdb;
    + struct gfs2_holder d_gh;
    + uint64_t offset = file->f_pos;
    + unsigned int x;
    + struct filldir_bad_entry *fbe;
    + int error;
    +
    + entries = gfs2_tune_get(sdp, gt_entries_per_readdir);
    + size = sizeof(struct filldir_bad) +
    + entries * (sizeof(struct filldir_bad_entry) + GFS2_FAST_NAME_SIZE);
    +
    + fdb = kzalloc(size, GFP_KERNEL);
    + if (!fdb)
    + return -ENOMEM;
    +
    + fdb->fdb_sbd = sdp;
    + fdb->fdb_entry = (struct filldir_bad_entry *)(fdb + 1); /* entry array follows the header */
    + fdb->fdb_entry_num = entries;
    + fdb->fdb_name = ((char *)fdb) + sizeof(struct filldir_bad) +
    + entries * sizeof(struct filldir_bad_entry); /* name area follows the entry array */
    + fdb->fdb_name_size = entries * GFS2_FAST_NAME_SIZE;
    +
    + gfs2_holder_init(dip->i_gl, LM_ST_SHARED, GL_ATIME, &d_gh);
    + error = gfs2_glock_nq_atime(&d_gh);
    + if (error) {
    + gfs2_holder_uninit(&d_gh);
    + goto out;
    + }
    +
    + error = gfs2_dir_read(dip, &offset, fdb, filldir_bad_func);
    +
    + gfs2_glock_dq_uninit(&d_gh);
    +
    + fdr.fdr_sbd = sdp;
    + fdr.fdr_prefetch = 0;
    + fdr.fdr_filldir = filldir;
    + fdr.fdr_opaque = dirent;
    +
    + for (x = 0; x < fdb->fdb_entry_off; x++) {
    + fbe = &fdb->fdb_entry[x];
    +
    + error = filldir_reg_func(&fdr,
    + fbe->fbe_name, fbe->fbe_length,
    + fbe->fbe_offset,
    + &fbe->fbe_inum, fbe->fbe_type);
    + if (error) {
    + file->f_pos = fbe->fbe_offset; /* resume at the refused entry */
    + error = 0;
    + goto out;
    + }
    + }
    +
    + file->f_pos = offset;
    +
    + out:
    + kfree(fdb);
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_readdir - Read directory entries from a directory
    + * @file: The directory to read from
    + * @dirent: Buffer for dirents
    + * @filldir: Function used to do the copying
    + *
    + * Tasks whose command name is exactly "nfsd" are served by readdir_bad();
    + * every other caller is served by readdir_reg().
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_readdir(struct file *file, void *dirent, filldir_t filldir)
    +{
    +	atomic_inc(&get_v2sdp(file->f_mapping->host->i_sb)->sd_ops_file);
    +
    +	if (strcmp(current->comm, "nfsd") == 0)
    +		return readdir_bad(file, dirent, filldir);
    +
    +	return readdir_reg(file, dirent, filldir);
    +}
    +
    +/**
    + * gfs2_ioctl - do an ioctl on a file
    + * @inode: the inode
    + * @file: the file pointer
    + * @cmd: the ioctl command
    + * @arg: the argument
    + *
    + * GFS2_IOCTL_IDENTIFY copies GFS2_MAGIC to the unsigned int that @arg
    + * points at; GFS2_IOCTL_SUPER is passed on to gfs2_ioctl_i().  Any other
    + * command yields -ENOTTY.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_ioctl(struct inode *inode, struct file *file, unsigned int cmd,
    +		      unsigned long arg)
    +{
    +	struct gfs2_inode *ip = get_v2ip(inode);
    +
    +	atomic_inc(&ip->i_sbd->sd_ops_file);
    +
    +	if (cmd == GFS2_IOCTL_IDENTIFY) {
    +		unsigned int magic = GFS2_MAGIC;
    +
    +		if (copy_to_user((unsigned int *)arg, &magic,
    +				 sizeof(unsigned int)))
    +			return -EFAULT;
    +		return 0;
    +	}
    +
    +	if (cmd == GFS2_IOCTL_SUPER)
    +		return gfs2_ioctl_i(ip, (void *)arg);
    +
    +	return -ENOTTY;
    +}
    +
    +/**
    + * gfs2_mmap - select the vm operations for a new mapping
    + * @file: The file to map
    + * @vma: The VMA which described the mapping
    + *
    + * With the inode glock held shared: a jdata file may not be mapped with
    + * VM_MAYSHARE (-EOPNOTSUPP) and otherwise gets the private vm_ops; a
    + * non-jdata file gets the sharewrite vm_ops when both VM_MAYSHARE and
    + * VM_MAYWRITE are set, and the private vm_ops otherwise.
    + *
    + * Returns: 0 or error code
    + */
    +
    +static int gfs2_mmap(struct file *file, struct vm_area_struct *vma)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_holder i_gh;
    +	int jdata;
    +	int error;
    +
    +	atomic_inc(&ip->i_sbd->sd_ops_file);
    +
    +	gfs2_holder_init(ip->i_gl, LM_ST_SHARED, GL_ATIME, &i_gh);
    +	error = gfs2_glock_nq_atime(&i_gh);
    +	if (error) {
    +		gfs2_holder_uninit(&i_gh);
    +		return error;
    +	}
    +
    +	jdata = gfs2_is_jdata(ip);
    +
    +	if (jdata && (vma->vm_flags & VM_MAYSHARE)) {
    +		error = -EOPNOTSUPP;
    +	} else if (!jdata &&
    +		   (vma->vm_flags & (VM_MAYSHARE | VM_MAYWRITE)) ==
    +		   (VM_MAYSHARE | VM_MAYWRITE)) {
    +		/* VM_MAYWRITE rather than VM_WRITE: mprotect() can turn
    +		   on VM_WRITE after the mapping has been set up. */
    +		vma->vm_ops = &gfs2_vm_ops_sharewrite;
    +	} else {
    +		vma->vm_ops = &gfs2_vm_ops_private;
    +	}
    +
    +	gfs2_glock_dq_uninit(&i_gh);
    +
    +	return error;
    +}
    +
    +/**
    + * gfs2_open - open a file
    + * @inode: the inode to open
    + * @file: the struct file for this opening
    + *
    + * Allocates the per-open struct gfs2_file and attaches it to @file.  For
    + * regular files the inode glock is then taken shared in order to refuse
    + * files larger than MAX_NON_LFS opened without O_LARGEFILE (-EFBIG), to
    + * turn on O_DIRECT when the inode carries GFS2_DIF_DIRECTIO, and to
    + * refuse O_DIRECT on jdata files (-EINVAL).
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_open(struct inode *inode, struct file *file)
    +{
    +	struct gfs2_inode *ip = get_v2ip(inode);
    +	struct gfs2_holder i_gh;
    +	struct gfs2_file *fp;
    +	int error;
    +
    +	atomic_inc(&ip->i_sbd->sd_ops_file);
    +
    +	fp = kzalloc(sizeof(struct gfs2_file), GFP_KERNEL);
    +	if (!fp)
    +		return -ENOMEM;
    +
    +	init_MUTEX(&fp->f_fl_mutex);
    +
    +	fp->f_vfile = file;
    +	fp->f_inode = ip;
    +
    +	gfs2_assert_warn(ip->i_sbd, !get_v2fp(file));
    +	set_v2fp(file, fp);
    +
    +	/* the remaining checks only concern regular files */
    +	if (!S_ISREG(ip->i_di.di_mode))
    +		return 0;
    +
    +	error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY,
    +				   &i_gh);
    +	if (error)
    +		goto fail;
    +
    +	if (ip->i_di.di_size > MAX_NON_LFS &&
    +	    !(file->f_flags & O_LARGEFILE)) {
    +		error = -EFBIG;
    +		goto fail_gunlock;
    +	}
    +
    +	/* Listen to the Direct I/O flag */
    +	if (ip->i_di.di_flags & GFS2_DIF_DIRECTIO)
    +		file->f_flags |= O_DIRECT;
    +
    +	/* Don't let the user open O_DIRECT on a jdata file */
    +	if ((file->f_flags & O_DIRECT) && gfs2_is_jdata(ip)) {
    +		error = -EINVAL;
    +		goto fail_gunlock;
    +	}
    +
    +	gfs2_glock_dq_uninit(&i_gh);
    +
    +	return 0;
    +
    + fail_gunlock:
    +	gfs2_glock_dq_uninit(&i_gh);
    +
    + fail:
    +	set_v2fp(file, NULL);
    +	kfree(fp);
    +
    +	return error;
    +}
    +
    +/**
    + * gfs2_close - called to close a struct file
    + * @inode: the inode the struct file belongs to
    + * @file: the struct file being closed
    + *
    + * Detaches the struct gfs2_file that gfs2_open() attached to @file and
    + * frees it.
    + *
    + * Returns: errno (-EIO if no struct gfs2_file was attached)
    + */
    +
    +static int gfs2_close(struct inode *inode, struct file *file)
    +{
    +	struct gfs2_sbd *sdp = get_v2sdp(inode->i_sb);
    +	struct gfs2_file *fp = get_v2fp(file);
    +
    +	atomic_inc(&sdp->sd_ops_file);
    +
    +	set_v2fp(file, NULL);
    +
    +	if (gfs2_assert_warn(sdp, fp))
    +		return -EIO;
    +
    +	kfree(fp);
    +
    +	return 0;
    +}
    +
    +/**
    + * gfs2_fsync - sync the dirty data for a file (across the cluster)
    + * @file: the file that points to the dentry (we ignore this)
    + * @dentry: the dentry that points to the inode to sync
    + * @datasync: not looked at by this implementation
    + *
    + * Calls gfs2_log_flush_glock() on the inode's glock.
    + *
    + * Returns: errno (always 0 here)
    + */
    +
    +static int gfs2_fsync(struct file *file, struct dentry *dentry, int datasync)
    +{
    +	struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    +	struct gfs2_sbd *sdp = ip->i_sbd;
    +
    +	atomic_inc(&sdp->sd_ops_file);
    +
    +	gfs2_log_flush_glock(ip->i_gl);
    +
    +	return 0;
    +}
    +
    +/**
    + * gfs2_lock - acquire/release a posix lock on a file
    + * @file: the file pointer
    + * @cmd: either modify or retrieve lock state, possibly wait
    + * @fl: type and range of lock
    + *
    + * Requests that are not FL_POSIX, and inodes with S_ISGID set but
    + * S_IXGRP clear, are refused with -ENOLCK.  With the localflocks mount
    + * argument the request is handled by the generic posix lock code under
    + * the big kernel lock; otherwise it is passed to the lock module through
    + * gfs2_lm_plock_get(), gfs2_lm_punlock() or gfs2_lm_plock().
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_lock(struct file *file, int cmd, struct file_lock *fl)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_sbd *sdp = ip->i_sbd;
    +	struct lm_lockname name =
    +		{ .ln_number = ip->i_num.no_addr,
    +		  .ln_type = LM_TYPE_PLOCK };
    +	int error = 0;
    +
    +	atomic_inc(&sdp->sd_ops_file);
    +
    +	if (!(fl->fl_flags & FL_POSIX))
    +		return -ENOLCK;
    +	/* setgid without group-execute */
    +	if ((ip->i_di.di_mode & S_ISGID) && !(ip->i_di.di_mode & S_IXGRP))
    +		return -ENOLCK;
    +
    +	if (!sdp->sd_args.ar_localflocks) {
    +		if (IS_GETLK(cmd))
    +			return gfs2_lm_plock_get(sdp, &name, file, fl);
    +		if (fl->fl_type == F_UNLCK)
    +			return gfs2_lm_punlock(sdp, &name, file, fl);
    +		return gfs2_lm_plock(sdp, &name, file, cmd, fl);
    +	}
    +
    +	/* node-local locking only */
    +	lock_kernel();
    +	if (IS_GETLK(cmd)) {
    +		struct file_lock *conflict = posix_test_lock(file, fl);
    +
    +		/* report "unlocked" unless a conflicting lock was found */
    +		fl->fl_type = F_UNLCK;
    +		if (conflict)
    +			memcpy(fl, conflict, sizeof(struct file_lock));
    +	} else {
    +		error = posix_lock_file_wait(file, fl);
    +	}
    +	unlock_kernel();
    +
    +	return error;
    +}
    +
    +/**
    + * gfs2_sendfile - Send bytes to a file or socket
    + * @in_file: The file to read from
    + * @offset: The beginning file offset
    + * @count: The amount of data
    + * @actor: passed through to generic_file_sendfile()
    + * @target: passed through to generic_file_sendfile()
    + *
    + * Holds the inode glock shared around generic_file_sendfile().  jdata
    + * files are refused with -EOPNOTSUPP.
    + *
    + * Outputs: offset - updated according to number of bytes read
    + *
    + * Returns: The number of bytes sent, errno on failure
    + */
    +
    +static ssize_t gfs2_sendfile(struct file *in_file, loff_t *offset, size_t count,
    +			     read_actor_t actor, void __user *target)
    +{
    +	struct gfs2_inode *ip = get_v2ip(in_file->f_mapping->host);
    +	struct gfs2_holder gh;
    +	ssize_t retval;
    +
    +	atomic_inc(&ip->i_sbd->sd_ops_file);
    +
    +	gfs2_holder_init(ip->i_gl, LM_ST_SHARED, GL_ATIME, &gh);
    +
    +	retval = gfs2_glock_nq_atime(&gh);
    +	if (!retval) {
    +		if (gfs2_is_jdata(ip))
    +			retval = -EOPNOTSUPP;
    +		else
    +			retval = generic_file_sendfile(in_file, offset, count,
    +						       actor, target);
    +
    +		gfs2_glock_dq(&gh);
    +	}
    +
    +	gfs2_holder_uninit(&gh);
    +
    +	return retval;
    +}
    +
    +/**
    + * do_flock - take or convert the flock glock held for an open file
    + * @file: the file pointer
    + * @cmd: the lock command; unless it is a SETLKW command the glock request
    + *       is made with LM_FLAG_TRY
    + * @fl: the lock being requested (F_WRLCK maps to an exclusive glock,
    + *      anything else to a shared one)
    + *
    + * The glock holder lives in the per-open struct gfs2_file and is
    + * protected by f_fl_mutex.  If a holder already exists in the requested
    + * state nothing is done; if it exists in the other state, the local
    + * flock and the glock are dropped first and then re-acquired.
    + *
    + * Returns: errno (-EAGAIN when a try-lock request failed)
    + */
    +
    +static int do_flock(struct file *file, int cmd, struct file_lock *fl)
    +{
    +	struct gfs2_file *fp = get_v2fp(file);
    +	struct gfs2_holder *fl_gh = &fp->f_fl_gh;
    +	struct gfs2_inode *ip = fp->f_inode;
    +	struct gfs2_glock *gl;
    +	unsigned int state = LM_ST_SHARED;
    +	int flags = GL_EXACT | GL_NOCACHE;
    +	int error = 0;
    +
    +	if (fl->fl_type == F_WRLCK)
    +		state = LM_ST_EXCLUSIVE;
    +	if (!IS_SETLKW(cmd))
    +		flags |= LM_FLAG_TRY;
    +
    +	down(&fp->f_fl_mutex);
    +
    +	gl = fl_gh->gh_gl;
    +	if (!gl) {
    +		error = gfs2_glock_get(ip->i_sbd,
    +				       ip->i_num.no_addr, &gfs2_flock_glops,
    +				       CREATE, &gl);
    +		if (error)
    +			goto out;
    +	} else if (fl_gh->gh_state == state) {
    +		/* already held in the requested state */
    +		goto out;
    +	} else {
    +		/* keep a reference across the dequeue below */
    +		gfs2_glock_hold(gl);
    +		flock_lock_file_wait(file,
    +				     &(struct file_lock){.fl_type = F_UNLCK});
    +		gfs2_glock_dq_uninit(fl_gh);
    +	}
    +
    +	gfs2_holder_init(gl, state, flags, fl_gh);
    +	gfs2_glock_put(gl);
    +
    +	error = gfs2_glock_nq(fl_gh);
    +	if (!error) {
    +		error = flock_lock_file_wait(file, fl);
    +		gfs2_assert_warn(ip->i_sbd, !error);
    +	} else {
    +		gfs2_holder_uninit(fl_gh);
    +		if (error == GLR_TRYFAILED)
    +			error = -EAGAIN;
    +	}
    +
    + out:
    +	up(&fp->f_fl_mutex);
    +
    +	return error;
    +}
    +
    +/**
    + * do_unflock - release the flock held for an open file
    + * @file: the file pointer
    + * @fl: the unlock request, applied to the local flock state
    + *
    + * Under f_fl_mutex, applies @fl locally and then drops the flock glock
    + * holder if one is currently set up.
    + */
    +
    +static void do_unflock(struct file *file, struct file_lock *fl)
    +{
    +	struct gfs2_file *fp = get_v2fp(file);
    +
    +	down(&fp->f_fl_mutex);
    +
    +	flock_lock_file_wait(file, fl);
    +	if (fp->f_fl_gh.gh_gl)
    +		gfs2_glock_dq_uninit(&fp->f_fl_gh);
    +
    +	up(&fp->f_fl_mutex);
    +}
    +
    +/**
    + * gfs2_flock - acquire/release a flock lock on a file
    + * @file: the file pointer
    + * @cmd: either modify or retrieve lock state, possibly wait
    + * @fl: type and range of lock
    + *
    + * Requests that are not FL_FLOCK, and inodes with S_ISGID set but
    + * S_IXGRP clear, are refused with -ENOLCK.  With the localflocks mount
    + * argument the request goes straight to flock_lock_file_wait();
    + * otherwise it is handled by do_unflock() or do_flock().
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_flock(struct file *file, int cmd, struct file_lock *fl)
    +{
    +	struct gfs2_inode *ip = get_v2ip(file->f_mapping->host);
    +	struct gfs2_sbd *sdp = ip->i_sbd;
    +
    +	atomic_inc(&sdp->sd_ops_file);
    +
    +	if (!(fl->fl_flags & FL_FLOCK))
    +		return -ENOLCK;
    +	/* setgid without group-execute */
    +	if ((ip->i_di.di_mode & S_ISGID) && !(ip->i_di.di_mode & S_IXGRP))
    +		return -ENOLCK;
    +
    +	if (sdp->sd_args.ar_localflocks)
    +		return flock_lock_file_wait(file, fl);
    +
    +	if (fl->fl_type != F_UNLCK)
    +		return do_flock(file, cmd, fl);
    +
    +	do_unflock(file, fl);
    +	return 0;
    +}
    +
    +/*
    + * Operations table carrying the data-path entry points (llseek, read,
    + * write, mmap, sendfile) together with open/release, ioctl, fsync and
    + * the posix/flock locking hooks.
    + */
    +struct file_operations gfs2_file_fops = {
    +	/* lifetime */
    +	.open = gfs2_open,
    +	.release = gfs2_close,
    +	/* data path */
    +	.llseek = gfs2_llseek,
    +	.read = gfs2_read,
    +	.write = gfs2_write,
    +	.mmap = gfs2_mmap,
    +	.sendfile = gfs2_sendfile,
    +	.fsync = gfs2_fsync,
    +	/* control and locking */
    +	.ioctl = gfs2_ioctl,
    +	.lock = gfs2_lock,
    +	.flock = gfs2_flock,
    +};
    +
    +/*
    + * Operations table carrying readdir together with open/release, ioctl,
    + * fsync and the posix/flock locking hooks; it has no read/write/mmap
    + * entries.
    + */
    +struct file_operations gfs2_dir_fops = {
    +	/* lifetime */
    +	.open = gfs2_open,
    +	.release = gfs2_close,
    +	/* directory contents */
    +	.readdir = gfs2_readdir,
    +	.fsync = gfs2_fsync,
    +	/* control and locking */
    +	.ioctl = gfs2_ioctl,
    +	.lock = gfs2_lock,
    +	.flock = gfs2_flock,
    +};
    +
    --- a/fs/gfs2/ops_file.h 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_file.h 2005-10-10 11:28:49.294787259 -0500
    @@ -0,0 +1,16 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#ifndef __OPS_FILE_DOT_H__
    +#define __OPS_FILE_DOT_H__
    +
    +extern struct file_operations gfs2_file_fops; /* table with the read/write/mmap/sendfile entry points */
    +extern struct file_operations gfs2_dir_fops; /* table with the readdir entry point */
    +
    +#endif /* __OPS_FILE_DOT_H__ */
    --- a/fs/gfs2/ops_fstype.c 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_fstype.c 2005-10-10 11:28:49.301786168 -0500
    @@ -0,0 +1,860 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#include <linux/sched.h>
    +#include <linux/slab.h>
    +#include <linux/spinlock.h>
    +#include <linux/completion.h>
    +#include <linux/buffer_head.h>
    +#include <linux/vmalloc.h>
    +#include <linux/blkdev.h>
    +#include <linux/kthread.h>
    +#include <asm/semaphore.h>
    +
    +#include "gfs2.h"
    +#include "daemon.h"
    +#include "glock.h"
    +#include "glops.h"
    +#include "inode.h"
    +#include "lm.h"
    +#include "mount.h"
    +#include "ops_export.h"
    +#include "ops_fstype.h"
    +#include "ops_super.h"
    +#include "recovery.h"
    +#include "rgrp.h"
    +#include "super.h"
    +#include "unlinked.h"
    +#include "sys.h"
    +
    +#define DO 0 /* presumably the value passed as the "undo" argument of the init_*() steps to perform the setup -- TODO confirm against callers */
    +#define UNDO 1 /* presumably the "undo" argument value that makes an init_*() step tear its work down again -- TODO confirm against callers */
    +
    +/**
    + * init_sbd - allocate and initialise the in-core superblock structure
    + * @sb: the VFS superblock the new structure is attached to
    + *
    + * The structure is allocated with vmalloc() and zeroed; its tunables,
    + * glock hash buckets, lists, spinlocks, semaphores and wait queues are
    + * then initialised.  Nothing is read from disk here.
    + *
    + * Returns: the new struct gfs2_sbd, or NULL if the allocation failed
    + */
    +
    +static struct gfs2_sbd *init_sbd(struct super_block *sb)
    +{
    +	struct gfs2_sbd *sdp = vmalloc(sizeof(struct gfs2_sbd));
    +	unsigned int bucket;
    +
    +	if (!sdp)
    +		return NULL;
    +
    +	memset(sdp, 0, sizeof(struct gfs2_sbd));
    +
    +	/* link the two superblock structures to each other */
    +	set_v2sdp(sb, sdp);
    +	sdp->sd_vfs = sb;
    +
    +	gfs2_tune_init(&sdp->sd_tune);
    +
    +	/* glock hash table and reclaim state */
    +	for (bucket = 0; bucket < GFS2_GL_HASH_SIZE; bucket++) {
    +		sdp->sd_gl_hash[bucket].hb_lock = RW_LOCK_UNLOCKED;
    +		INIT_LIST_HEAD(&sdp->sd_gl_hash[bucket].hb_list);
    +	}
    +	INIT_LIST_HEAD(&sdp->sd_reclaim_list);
    +	spin_lock_init(&sdp->sd_reclaim_lock);
    +	init_waitqueue_head(&sdp->sd_reclaim_wq);
    +
    +	/* inode numbers and statfs */
    +	init_MUTEX(&sdp->sd_inum_mutex);
    +	spin_lock_init(&sdp->sd_statfs_spin);
    +	init_MUTEX(&sdp->sd_statfs_mutex);
    +
    +	/* resource group index */
    +	spin_lock_init(&sdp->sd_rindex_spin);
    +	init_MUTEX(&sdp->sd_rindex_mutex);
    +	INIT_LIST_HEAD(&sdp->sd_rindex_list);
    +	INIT_LIST_HEAD(&sdp->sd_rindex_mru_list);
    +	INIT_LIST_HEAD(&sdp->sd_rindex_recent_list);
    +
    +	/* journal index */
    +	INIT_LIST_HEAD(&sdp->sd_jindex_list);
    +	spin_lock_init(&sdp->sd_jindex_spin);
    +	init_MUTEX(&sdp->sd_jindex_mutex);
    +
    +	/* unlinked inodes */
    +	INIT_LIST_HEAD(&sdp->sd_unlinked_list);
    +	spin_lock_init(&sdp->sd_unlinked_spin);
    +	init_MUTEX(&sdp->sd_unlinked_mutex);
    +
    +	/* quota */
    +	INIT_LIST_HEAD(&sdp->sd_quota_list);
    +	spin_lock_init(&sdp->sd_quota_spin);
    +	init_MUTEX(&sdp->sd_quota_mutex);
    +
    +	/* log */
    +	spin_lock_init(&sdp->sd_log_lock);
    +	init_waitqueue_head(&sdp->sd_log_trans_wq);
    +	init_waitqueue_head(&sdp->sd_log_flush_wq);
    +
    +	INIT_LIST_HEAD(&sdp->sd_log_le_gl);
    +	INIT_LIST_HEAD(&sdp->sd_log_le_buf);
    +	INIT_LIST_HEAD(&sdp->sd_log_le_revoke);
    +	INIT_LIST_HEAD(&sdp->sd_log_le_rg);
    +	INIT_LIST_HEAD(&sdp->sd_log_le_databuf);
    +
    +	INIT_LIST_HEAD(&sdp->sd_log_blks_list);
    +	init_waitqueue_head(&sdp->sd_log_blks_wait);
    +
    +	INIT_LIST_HEAD(&sdp->sd_ail1_list);
    +	INIT_LIST_HEAD(&sdp->sd_ail2_list);
    +
    +	init_MUTEX(&sdp->sd_log_flush_lock);
    +	INIT_LIST_HEAD(&sdp->sd_log_flush_list);
    +
    +	INIT_LIST_HEAD(&sdp->sd_revoke_list);
    +
    +	init_MUTEX(&sdp->sd_freeze_lock);
    +
    +	return sdp;
    +}
    +
    +/**
    + * init_vfs - fill in the VFS superblock fields GFS2 controls
    + * @sdp: the in-core superblock, already linked to its VFS superblock
    + *
    + * Installs the magic number, super and export operations and maximum
    + * file size, records whether the mount asked for noatime/nodiratime and
    + * then forces both flags on, and sets provisional block-size values so
    + * that the on-disk superblock can be read.
    + */
    +
    +static void init_vfs(struct gfs2_sbd *sdp)
    +{
    +	struct super_block *sb = sdp->sd_vfs;
    +
    +	sb->s_op = &gfs2_super_ops;
    +	sb->s_export_op = &gfs2_export_ops;
    +	sb->s_magic = GFS2_MAGIC;
    +	sb->s_maxbytes = MAX_LFS_FILESIZE;
    +
    +	/* remember the user's choice before the flags are forced on below */
    +	if (sb->s_flags & (MS_NOATIME | MS_NODIRATIME))
    +		set_bit(SDF_NOATIME, &sdp->sd_flags);
    +
    +	/* Don't let the VFS update atimes. GFS2 handles this itself. */
    +	sb->s_flags |= MS_NOATIME | MS_NODIRATIME;
    +
    +	/* Set up the buffer cache and fill in some fake block size values
    +	   to allow us to read-in the on-disk superblock. */
    +	sdp->sd_sb.sb_bsize = sb_min_blocksize(sb, GFS2_BASIC_BLOCK);
    +	sdp->sd_sb.sb_bsize_shift = sb->s_blocksize_bits;
    +	sdp->sd_fsb2bb_shift =
    +		sdp->sd_sb.sb_bsize_shift - GFS2_BASIC_BLOCK_SHIFT;
    +	sdp->sd_fsb2bb = 1 << sdp->sd_fsb2bb_shift;
    +}
    +
    +/**
    + * init_names - work out the lock protocol and lock table names
    + * @sdp: the in-core superblock
    + * @silent: passed on to gfs2_check_sb()
    + *
    + * Names given as mount arguments take precedence.  If either is empty
    + * the on-disk superblock is read and checked, and its names fill in the
    + * blanks; if the table name is still empty the VFS s_id is used.  The
    + * results are stored in sd_proto_name and sd_table_name.
    + *
    + * Returns: errno
    + */
    +
    +static int init_names(struct gfs2_sbd *sdp, int silent)
    +{
    +	struct gfs2_sb *sb = NULL;
    +	char *proto = sdp->sd_args.ar_lockproto;
    +	char *table = sdp->sd_args.ar_locktable;
    +	int error = 0;
    +
    +	/* Try to autodetect */
    +
    +	if (!proto[0] || !table[0]) {
    +		struct buffer_head *bh;
    +
    +		bh = sb_getblk(sdp->sd_vfs,
    +			       GFS2_SB_ADDR >> sdp->sd_fsb2bb_shift);
    +
    +		/* drop any cached state so the block is read from disk */
    +		lock_buffer(bh);
    +		clear_buffer_uptodate(bh);
    +		clear_buffer_dirty(bh);
    +		unlock_buffer(bh);
    +
    +		ll_rw_block(READ, 1, &bh);
    +		wait_on_buffer(bh);
    +
    +		if (!buffer_uptodate(bh)) {
    +			brelse(bh);
    +			return -EIO;
    +		}
    +
    +		sb = kmalloc(sizeof(struct gfs2_sb), GFP_KERNEL);
    +		if (!sb) {
    +			brelse(bh);
    +			return -ENOMEM;
    +		}
    +		gfs2_sb_in(sb, bh->b_data);
    +		brelse(bh);
    +
    +		error = gfs2_check_sb(sdp, sb, silent);
    +		if (error)
    +			goto out;
    +
    +		if (!proto[0])
    +			proto = sb->sb_lockproto;
    +		if (!table[0])
    +			table = sb->sb_locktable;
    +	}
    +
    +	if (!table[0])
    +		table = sdp->sd_vfs->s_id;
    +
    +	/* proto/table may point into sb, so copy before it is freed */
    +	snprintf(sdp->sd_proto_name, GFS2_FSNAME_LEN, "%s", proto);
    +	snprintf(sdp->sd_table_name, GFS2_FSNAME_LEN, "%s", table);
    +
    + out:
    +	kfree(sb);
    +
    +	return error;
    +}
    +
    +/**
    + * init_locking - start the glock daemons and take the mount-time glocks
    + * @sdp: the in-core superblock
    + * @mount_gh: holder that receives the exclusive mount glock
    + * @undo: if non-zero, tear down what a previous successful call set up
    + *
    + * Starts gfs2_scand and ar_num_glockd gfs2_glockd threads, acquires the
    + * mount glock (exclusive) and the live glock (shared), and creates the
    + * rename and transaction glocks.  On failure everything set up so far
    + * is undone in reverse order.
    + *
    + * A kthread_run() failure is reported with the errno encoded in the
    + * returned pointer (PTR_ERR()); IS_ERR() alone only yields a boolean.
    + *
    + * Returns: errno (0 on success and on the @undo path)
    + */
    +
    +static int init_locking(struct gfs2_sbd *sdp, struct gfs2_holder *mount_gh,
    +			int undo)
    +{
    +	struct task_struct *p;
    +	int error = 0;
    +
    +	if (undo)
    +		goto fail_trans;
    +
    +	p = kthread_run(gfs2_scand, sdp, "gfs2_scand");
    +	if (IS_ERR(p)) {
    +		error = PTR_ERR(p);
    +		fs_err(sdp, "can't start scand thread: %d\n", error);
    +		return error;
    +	}
    +	sdp->sd_scand_process = p;
    +
    +	/* sd_glockd_num counts the threads started so far, which is what
    +	   the unwind loop at "fail" relies on */
    +	for (sdp->sd_glockd_num = 0;
    +	     sdp->sd_glockd_num < sdp->sd_args.ar_num_glockd;
    +	     sdp->sd_glockd_num++) {
    +		p = kthread_run(gfs2_glockd, sdp, "gfs2_glockd");
    +		if (IS_ERR(p)) {
    +			error = PTR_ERR(p);
    +			fs_err(sdp, "can't start glockd thread: %d\n", error);
    +			goto fail;
    +		}
    +		sdp->sd_glockd_process[sdp->sd_glockd_num] = p;
    +	}
    +
    +	error = gfs2_glock_nq_num(sdp,
    +				  GFS2_MOUNT_LOCK, &gfs2_nondisk_glops,
    +				  LM_ST_EXCLUSIVE, LM_FLAG_NOEXP | GL_NOCACHE,
    +				  mount_gh);
    +	if (error) {
    +		fs_err(sdp, "can't acquire mount glock: %d\n", error);
    +		goto fail;
    +	}
    +
    +	error = gfs2_glock_nq_num(sdp,
    +				  GFS2_LIVE_LOCK, &gfs2_nondisk_glops,
    +				  LM_ST_SHARED,
    +				  LM_FLAG_NOEXP | GL_EXACT | GL_NEVER_RECURSE,
    +				  &sdp->sd_live_gh);
    +	if (error) {
    +		fs_err(sdp, "can't acquire live glock: %d\n", error);
    +		goto fail_mount;
    +	}
    +
    +	error = gfs2_glock_get(sdp, GFS2_RENAME_LOCK, &gfs2_nondisk_glops,
    +			       CREATE, &sdp->sd_rename_gl);
    +	if (error) {
    +		fs_err(sdp, "can't create rename glock: %d\n", error);
    +		goto fail_live;
    +	}
    +
    +	error = gfs2_glock_get(sdp, GFS2_TRANS_LOCK, &gfs2_trans_glops,
    +			       CREATE, &sdp->sd_trans_gl);
    +	if (error) {
    +		fs_err(sdp, "can't create transaction glock: %d\n", error);
    +		goto fail_rename;
    +	}
    +	set_bit(GLF_STICKY, &sdp->sd_trans_gl->gl_flags);
    +
    +	return 0;
    +
    + fail_trans:
    +	gfs2_glock_put(sdp->sd_trans_gl);
    +
    + fail_rename:
    +	gfs2_glock_put(sdp->sd_rename_gl);
    +
    + fail_live:
    +	gfs2_glock_dq_uninit(&sdp->sd_live_gh);
    +
    + fail_mount:
    +	gfs2_glock_dq_uninit(mount_gh);
    +
    + fail:
    +	while (sdp->sd_glockd_num--)
    +		kthread_stop(sdp->sd_glockd_process[sdp->sd_glockd_num]);
    +
    +	kthread_stop(sdp->sd_scand_process);
    +
    +	return error;
    +}
    +
    +/**
    + * init_sb - read the superblock and look up the master directory
    + * @sdp: the filesystem
    + * @silent: passed through to gfs2_read_sb()
    + * @undo: when non-zero, only release sd_master_dir and return
    + *
    + * Returns: 0 on success or after an undo, -EINVAL if the filesystem block
    + * size is smaller than the device sector size or larger than PAGE_SIZE,
    + * otherwise the error from the failing call
    + */
    +
    +static int init_sb(struct gfs2_sbd *sdp, int silent, int undo)
    +{
    + struct super_block *sb = sdp->sd_vfs;
    + struct gfs2_holder sb_gh;
    + int error = 0;
    +
    + if (undo) {
    + gfs2_inode_put(sdp->sd_master_dir);
    + return 0;
    + }
    +
    + /* The superblock glock is held (shared) only for the duration of
    + this function; every path below leaves through "out". */
    + error = gfs2_glock_nq_num(sdp,
    + GFS2_SB_LOCK, &gfs2_meta_glops,
    + LM_ST_SHARED, 0, &sb_gh);
    + if (error) {
    + fs_err(sdp, "can't acquire superblock glock: %d\n", error);
    + return error;
    + }
    +
    + error = gfs2_read_sb(sdp, sb_gh.gh_gl, silent);
    + if (error) {
    + fs_err(sdp, "can't read superblock: %d\n", error);
    + goto out;
    + }
    +
    + /* Set up the buffer cache and SB for real */
    + /* Preset the result for the two block-size sanity checks below */
    + error = -EINVAL;
    + if (sdp->sd_sb.sb_bsize < bdev_hardsect_size(sb->s_bdev)) {
    + fs_err(sdp, "FS block size (%u) is too small for device "
    + "block size (%u)\n",
    + sdp->sd_sb.sb_bsize, bdev_hardsect_size(sb->s_bdev));
    + goto out;
    + }
    + if (sdp->sd_sb.sb_bsize > PAGE_SIZE) {
    + fs_err(sdp, "FS block size (%u) is too big for machine "
    + "page size (%u)\n",
    + sdp->sd_sb.sb_bsize, (unsigned int)PAGE_SIZE);
    + goto out;
    + }
    +
    + /* Get rid of buffers from the original block size */
    + sb_gh.gh_gl->gl_ops->go_inval(sb_gh.gh_gl, DIO_METADATA | DIO_DATA);
    + sb_gh.gh_gl->gl_aspace->i_blkbits = sdp->sd_sb.sb_bsize_shift;
    +
    + sb_set_blocksize(sb, sdp->sd_sb.sb_bsize);
    +
    + /* On failure the error is logged and returned via "out" below */
    + error = gfs2_lookup_master_dir(sdp);
    + if (error)
    + fs_err(sdp, "can't read in master directory: %d\n", error);
    +
    + out:
    + gfs2_glock_dq_uninit(&sb_gh);
    +
    + return error;
    +}
    +
    +/**
    + * init_journal - look up the journal index, claim a journal and start recoverd
    + * @sdp: the filesystem
    + * @undo: when non-zero, tear down what a previous successful call set up
    + *
    + * In spectator mode journal 0 is used for sizing only and no journal glocks
    + * are taken.  Otherwise the journal selected by ls_jid is locked and
    + * checked.  The first mounter recovers every journal; other non-spectator
    + * mounters recover only their own.
    + *
    + * Returns: 0 on success (or after an undo), otherwise a negative errno
    + */
    +
    +static int init_journal(struct gfs2_sbd *sdp, int undo)
    +{
    + struct gfs2_holder ji_gh;
    + struct task_struct *p;
    + /* non-zero while ji_gh is held and must be dropped on the way out */
    + int jindex = 1;
    + int error = 0;
    +
    + if (undo) {
    + jindex = 0;
    + goto fail_recoverd;
    + }
    +
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "jindex",
    + &sdp->sd_jindex);
    + if (error) {
    + fs_err(sdp, "can't lookup journal index: %d\n", error);
    + return error;
    + }
    + set_bit(GLF_STICKY, &sdp->sd_jindex->i_gl->gl_flags);
    +
    + /* Load in the journal index special file */
    +
    + error = gfs2_jindex_hold(sdp, &ji_gh);
    + if (error) {
    + fs_err(sdp, "can't read journal index: %d\n", error);
    + goto fail;
    + }
    +
    + /* Preset the result for the journal-count and ls_jid range checks */
    + error = -EINVAL;
    + if (!gfs2_jindex_size(sdp)) {
    + fs_err(sdp, "no journals!\n");
    + goto fail_jindex;
    + }
    +
    + if (sdp->sd_args.ar_spectator) {
    + sdp->sd_jdesc = gfs2_jdesc_find(sdp, 0);
    + sdp->sd_log_blks_free = sdp->sd_jdesc->jd_blocks;
    + } else {
    + if (sdp->sd_lockstruct.ls_jid >= gfs2_jindex_size(sdp)) {
    + fs_err(sdp, "can't mount journal #%u\n",
    + sdp->sd_lockstruct.ls_jid);
    + fs_err(sdp, "there are only %u journals (0 - %u)\n",
    + gfs2_jindex_size(sdp),
    + gfs2_jindex_size(sdp) - 1);
    + goto fail_jindex;
    + }
    + sdp->sd_jdesc = gfs2_jdesc_find(sdp, sdp->sd_lockstruct.ls_jid);
    +
    + error = gfs2_glock_nq_num(sdp,
    + sdp->sd_lockstruct.ls_jid,
    + &gfs2_journal_glops,
    + LM_ST_EXCLUSIVE, LM_FLAG_NOEXP,
    + &sdp->sd_journal_gh);
    + if (error) {
    + fs_err(sdp, "can't acquire journal glock: %d\n", error);
    + goto fail_jindex;
    + }
    +
    + error = gfs2_glock_nq_init(sdp->sd_jdesc->jd_inode->i_gl,
    + LM_ST_SHARED,
    + LM_FLAG_NOEXP | GL_EXACT,
    + &sdp->sd_jinode_gh);
    + if (error) {
    + fs_err(sdp, "can't acquire journal inode glock: %d\n",
    + error);
    + goto fail_journal_gh;
    + }
    +
    + error = gfs2_jdesc_check(sdp->sd_jdesc);
    + if (error) {
    + fs_err(sdp, "my journal (%u) is bad: %d\n",
    + sdp->sd_jdesc->jd_jid, error);
    + goto fail_jinode_gh;
    + }
    + sdp->sd_log_blks_free = sdp->sd_jdesc->jd_blocks;
    + }
    +
    + if (sdp->sd_lockstruct.ls_first) {
    + unsigned int x;
    + for (x = 0; x < sdp->sd_journals; x++) {
    + error = gfs2_recover_journal(gfs2_jdesc_find(sdp, x),
    + WAIT);
    + if (error) {
    + fs_err(sdp, "error recovering journal %u: %d\n",
    + x, error);
    + goto fail_jinode_gh;
    + }
    + }
    +
    + gfs2_lm_others_may_mount(sdp);
    + } else if (!sdp->sd_args.ar_spectator) {
    + error = gfs2_recover_journal(sdp->sd_jdesc, WAIT);
    + if (error) {
    + fs_err(sdp, "error recovering my journal: %d\n", error);
    + goto fail_jinode_gh;
    + }
    + }
    +
    + set_bit(SDF_JOURNAL_CHECKED, &sdp->sd_flags);
    + gfs2_glock_dq_uninit(&ji_gh);
    + jindex = 0;
    +
    + /* Disown my Journal glock */
    +
    + sdp->sd_journal_gh.gh_owner = NULL;
    + sdp->sd_jinode_gh.gh_owner = NULL;
    +
    + p = kthread_run(gfs2_recoverd, sdp, "gfs2_recoverd");
    + if (IS_ERR(p)) {
    + /* IS_ERR() is only a boolean; PTR_ERR() yields the real errno */
    + error = PTR_ERR(p);
    + fs_err(sdp, "can't start recoverd thread: %d\n", error);
    + goto fail_jinode_gh;
    + }
    + sdp->sd_recoverd_process = p;
    +
    + return 0;
    +
    + /* Cleanup ladder: each label undoes one step and falls into the next */
    +
    + fail_recoverd:
    + kthread_stop(sdp->sd_recoverd_process);
    +
    + fail_jinode_gh:
    + if (!sdp->sd_args.ar_spectator)
    + gfs2_glock_dq_uninit(&sdp->sd_jinode_gh);
    +
    + fail_journal_gh:
    + if (!sdp->sd_args.ar_spectator)
    + gfs2_glock_dq_uninit(&sdp->sd_journal_gh);
    +
    + fail_jindex:
    + gfs2_jindex_free(sdp);
    + if (jindex)
    + gfs2_glock_dq_uninit(&ji_gh);
    +
    + fail:
    + gfs2_inode_put(sdp->sd_jindex);
    +
    + return error;
    +}
    +
    +/**
    + * init_inodes - look up the system inodes and create the root dentry
    + * @sdp: the filesystem
    + * @undo: when non-zero, release everything a successful call acquired
    + *
    + * Looks up "inum", "statfs", "rindex", "quota" and "root" in the master
    + * directory and stores the root dentry in sd_vfs->s_root.
    + *
    + * Returns: 0 on success (or after an undo), -ENOMEM if the root inode or
    + * dentry cannot be obtained, otherwise the error from the failing lookup
    + */
    +
    +static int init_inodes(struct gfs2_sbd *sdp, int undo)
    +{
    + struct inode *inode;
    + struct dentry **dentry = &sdp->sd_vfs->s_root;
    + int error = 0;
    +
    + if (undo)
    + goto fail_dput;
    +
    + /* Read in the master inode number inode */
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "inum",
    + &sdp->sd_inum_inode);
    + if (error) {
    + fs_err(sdp, "can't read in inum inode: %d\n", error);
    + return error;
    + }
    +
    + /* Read in the master statfs inode */
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "statfs",
    + &sdp->sd_statfs_inode);
    + if (error) {
    + fs_err(sdp, "can't read in statfs inode: %d\n", error);
    + goto fail;
    + }
    +
    + /* Read in the resource index inode */
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "rindex",
    + &sdp->sd_rindex);
    + if (error) {
    + fs_err(sdp, "can't get resource index inode: %d\n", error);
    + goto fail_statfs;
    + }
    + set_bit(GLF_STICKY, &sdp->sd_rindex->i_gl->gl_flags);
    + /* NOTE(review): starting one behind gl_vn presumably marks the
    + cached rindex as stale so it is read on first use - confirm */
    + sdp->sd_rindex_vn = sdp->sd_rindex->i_gl->gl_vn - 1;
    +
    + /* Read in the quota inode */
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "quota",
    + &sdp->sd_quota_inode);
    + if (error) {
    + fs_err(sdp, "can't get quota file inode: %d\n", error);
    + goto fail_rindex;
    + }
    +
    + /* Get the root inode */
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "root",
    + &sdp->sd_root_dir);
    + if (error) {
    + fs_err(sdp, "can't read in root inode: %d\n", error);
    + goto fail_qinode;
    + }
    +
    + /* Get the root inode/dentry */
    + inode = gfs2_ip2v(sdp->sd_root_dir);
    + if (!inode) {
    + fs_err(sdp, "can't get root inode\n");
    + error = -ENOMEM;
    + goto fail_rooti;
    + }
    +
    + *dentry = d_alloc_root(inode);
    + if (!*dentry) {
    + /* no dentry took ownership of the inode, so drop it here */
    + iput(inode);
    + fs_err(sdp, "can't get root dentry\n");
    + error = -ENOMEM;
    + goto fail_rooti;
    + }
    +
    + return 0;
    +
    + /* Cleanup ladder: each label undoes one step and falls into the next */
    +
    + fail_dput:
    + dput(*dentry);
    + *dentry = NULL;
    +
    + fail_rooti:
    + gfs2_inode_put(sdp->sd_root_dir);
    +
    + fail_qinode:
    + gfs2_inode_put(sdp->sd_quota_inode);
    +
    + fail_rindex:
    + gfs2_clear_rgrpd(sdp);
    + gfs2_inode_put(sdp->sd_rindex);
    +
    + fail_statfs:
    + gfs2_inode_put(sdp->sd_statfs_inode);
    +
    + fail:
    + gfs2_inode_put(sdp->sd_inum_inode);
    +
    + return error;
    +}
    +
    +/**
    + * init_per_node - look up and lock this node's private system files
    + * @sdp: the filesystem
    + * @undo: when non-zero, unlock and release what a successful call acquired
    + *
    + * Does nothing (for both do and undo) on a spectator mount.  Otherwise
    + * looks up the four files in "per_node" whose names end in this node's
    + * journal id and takes an exclusive glock on each.
    + *
    + * Returns: 0 on success (or after an undo), otherwise the error from the
    + * failing lookup or lock request
    + */
    +
    +static int init_per_node(struct gfs2_sbd *sdp, int undo)
    +{
    + struct gfs2_inode *pn = NULL;
    + /* holds "<name><jid>"; the longest prefix used below is 13 chars */
    + char buf[30];
    + int error = 0;
    +
    + if (sdp->sd_args.ar_spectator)
    + return 0;
    +
    + if (undo)
    + goto fail_qc_gh;
    +
    + error = gfs2_lookup_simple(sdp->sd_master_dir, "per_node", &pn);
    + if (error) {
    + fs_err(sdp, "can't find per_node directory: %d\n", error);
    + return error;
    + }
    +
    + sprintf(buf, "inum_range%u", sdp->sd_jdesc->jd_jid);
    + error = gfs2_lookup_simple(pn, buf, &sdp->sd_ir_inode);
    + if (error) {
    + fs_err(sdp, "can't find local \"ir\" file: %d\n", error);
    + goto fail;
    + }
    +
    + sprintf(buf, "statfs_change%u", sdp->sd_jdesc->jd_jid);
    + error = gfs2_lookup_simple(pn, buf, &sdp->sd_sc_inode);
    + if (error) {
    + fs_err(sdp, "can't find local \"sc\" file: %d\n", error);
    + goto fail_ir_i;
    + }
    +
    + sprintf(buf, "unlinked_tag%u", sdp->sd_jdesc->jd_jid);
    + error = gfs2_lookup_simple(pn, buf, &sdp->sd_ut_inode);
    + if (error) {
    + fs_err(sdp, "can't find local \"ut\" file: %d\n", error);
    + goto fail_sc_i;
    + }
    +
    + sprintf(buf, "quota_change%u", sdp->sd_jdesc->jd_jid);
    + error = gfs2_lookup_simple(pn, buf, &sdp->sd_qc_inode);
    + if (error) {
    + fs_err(sdp, "can't find local \"qc\" file: %d\n", error);
    + goto fail_ut_i;
    + }
    +
    + /* The directory itself is no longer needed; clearing pn keeps the
    + "fail" label from putting it a second time. */
    + gfs2_inode_put(pn);
    + pn = NULL;
    +
    + error = gfs2_glock_nq_init(sdp->sd_ir_inode->i_gl,
    + LM_ST_EXCLUSIVE, GL_NEVER_RECURSE,
    + &sdp->sd_ir_gh);
    + if (error) {
    + fs_err(sdp, "can't lock local \"ir\" file: %d\n", error);
    + goto fail_qc_i;
    + }
    +
    + error = gfs2_glock_nq_init(sdp->sd_sc_inode->i_gl,
    + LM_ST_EXCLUSIVE, GL_NEVER_RECURSE,
    + &sdp->sd_sc_gh);
    + if (error) {
    + fs_err(sdp, "can't lock local \"sc\" file: %d\n", error);
    + goto fail_ir_gh;
    + }
    +
    + error = gfs2_glock_nq_init(sdp->sd_ut_inode->i_gl,
    + LM_ST_EXCLUSIVE, GL_NEVER_RECURSE,
    + &sdp->sd_ut_gh);
    + if (error) {
    + fs_err(sdp, "can't lock local \"ut\" file: %d\n", error);
    + goto fail_sc_gh;
    + }
    +
    + error = gfs2_glock_nq_init(sdp->sd_qc_inode->i_gl,
    + LM_ST_EXCLUSIVE, GL_NEVER_RECURSE,
    + &sdp->sd_qc_gh);
    + if (error) {
    + fs_err(sdp, "can't lock local \"qc\" file: %d\n", error);
    + goto fail_ut_gh;
    + }
    +
    + return 0;
    +
    + /* Cleanup ladder: glock holders first, then the inode references */
    +
    + fail_qc_gh:
    + gfs2_glock_dq_uninit(&sdp->sd_qc_gh);
    +
    + fail_ut_gh:
    + gfs2_glock_dq_uninit(&sdp->sd_ut_gh);
    +
    + fail_sc_gh:
    + gfs2_glock_dq_uninit(&sdp->sd_sc_gh);
    +
    + fail_ir_gh:
    + gfs2_glock_dq_uninit(&sdp->sd_ir_gh);
    +
    + fail_qc_i:
    + gfs2_inode_put(sdp->sd_qc_inode);
    +
    + fail_ut_i:
    + gfs2_inode_put(sdp->sd_ut_inode);
    +
    + fail_sc_i:
    + gfs2_inode_put(sdp->sd_sc_inode);
    +
    + fail_ir_i:
    + gfs2_inode_put(sdp->sd_ir_inode);
    +
    + fail:
    + if (pn)
    + gfs2_inode_put(pn);
    + return error;
    +}
    +
    +/**
    + * init_threads - start the logd, quotad and inoded kernel threads
    + * @sdp: the filesystem
    + * @undo: when non-zero, stop the threads a successful call started
    + *
    + * Returns: 0 on success (or after an undo), otherwise the negative errno
    + * reported by kthread_run()
    + */
    +
    +static int init_threads(struct gfs2_sbd *sdp, int undo)
    +{
    + struct task_struct *p;
    + int error = 0;
    +
    + if (undo)
    + goto fail_inoded;
    +
    + sdp->sd_log_flush_time = jiffies;
    + sdp->sd_jindex_refresh_time = jiffies;
    +
    + p = kthread_run(gfs2_logd, sdp, "gfs2_logd");
    + if (IS_ERR(p)) {
    + /* IS_ERR() is only a boolean; PTR_ERR() yields the real errno */
    + error = PTR_ERR(p);
    + fs_err(sdp, "can't start logd thread: %d\n", error);
    + return error;
    + }
    + sdp->sd_logd_process = p;
    +
    + sdp->sd_statfs_sync_time = jiffies;
    + sdp->sd_quota_sync_time = jiffies;
    +
    + p = kthread_run(gfs2_quotad, sdp, "gfs2_quotad");
    + if (IS_ERR(p)) {
    + error = PTR_ERR(p);
    + fs_err(sdp, "can't start quotad thread: %d\n", error);
    + goto fail;
    + }
    + sdp->sd_quotad_process = p;
    +
    + p = kthread_run(gfs2_inoded, sdp, "gfs2_inoded");
    + if (IS_ERR(p)) {
    + error = PTR_ERR(p);
    + fs_err(sdp, "can't start inoded thread: %d\n", error);
    + goto fail_quotad;
    + }
    + sdp->sd_inoded_process = p;
    +
    + return 0;
    +
    + /* Cleanup ladder: stop the threads in reverse start order */
    +
    + fail_inoded:
    + kthread_stop(sdp->sd_inoded_process);
    +
    + fail_quotad:
    + kthread_stop(sdp->sd_quotad_process);
    +
    + fail:
    + kthread_stop(sdp->sd_logd_process);
    +
    + return error;
    +}
    +
    +/**
    + * fill_super - Read in superblock
    + * @sb: The VFS superblock
    + * @data: Mount options
    + * @silent: Don't complain if it's not a GFS2 filesystem
    + *
    + * Runs the init_*() stages in order; on failure the stages already
    + * completed are undone in reverse order by calling them with UNDO.
    + *
    + * Returns: errno
    + */
    +
    +static int fill_super(struct super_block *sb, void *data, int silent)
    +{
    + struct gfs2_sbd *sdp;
    + struct gfs2_holder mount_gh;
    + int error;
    +
    + sdp = init_sbd(sb);
    + if (!sdp) {
    + printk("GFS2: can't alloc struct gfs2_sbd\n");
    + return -ENOMEM;
    + }
    +
    + error = gfs2_mount_args(sdp, (char *)data, 0);
    + if (error) {
    + printk("GFS2: can't parse mount arguments\n");
    + goto fail;
    + }
    +
    + init_vfs(sdp);
    +
    + error = init_names(sdp, silent);
    + if (error)
    + goto fail;
    +
    + error = gfs2_sys_fs_add(sdp);
    + if (error)
    + goto fail;
    +
    + error = gfs2_lm_mount(sdp, silent);
    + if (error)
    + goto fail_sys;
    +
    + /* mount_gh is handed to init_locking() here and released at the
    + end of a successful mount, or by init_locking(UNDO) on failure */
    + error = init_locking(sdp, &mount_gh, DO);
    + if (error)
    + goto fail_lm;
    +
    + error = init_sb(sdp, silent, DO);
    + if (error)
    + goto fail_locking;
    +
    + error = init_journal(sdp, DO);
    + if (error)
    + goto fail_sb;
    +
    + error = init_inodes(sdp, DO);
    + if (error)
    + goto fail_journals;
    +
    + error = init_per_node(sdp, DO);
    + if (error)
    + goto fail_inodes;
    +
    + error = gfs2_statfs_init(sdp);
    + if (error) {
    + fs_err(sdp, "can't initialize statfs subsystem: %d\n", error);
    + goto fail_per_node;
    + }
    +
    + error = init_threads(sdp, DO);
    + if (error)
    + goto fail_per_node;
    +
    + if (!(sb->s_flags & MS_RDONLY)) {
    + error = gfs2_make_fs_rw(sdp);
    + if (error) {
    + fs_err(sdp, "can't make FS RW: %d\n", error);
    + goto fail_threads;
    + }
    + }
    +
    + gfs2_glock_dq_uninit(&mount_gh);
    +
    + return 0;
    +
    + /* Cleanup ladder: each label undoes one stage and falls into the next */
    +
    + fail_threads:
    + init_threads(sdp, UNDO);
    +
    + fail_per_node:
    + init_per_node(sdp, UNDO);
    +
    + fail_inodes:
    + init_inodes(sdp, UNDO);
    +
    + fail_journals:
    + init_journal(sdp, UNDO);
    +
    + fail_sb:
    + init_sb(sdp, 0, UNDO);
    +
    + fail_locking:
    + init_locking(sdp, &mount_gh, UNDO);
    +
    + fail_lm:
    + gfs2_gl_hash_clear(sdp, WAIT);
    + gfs2_lm_unmount(sdp);
    + /* keep retrying until invalidate_inodes() returns zero */
    + while (invalidate_inodes(sb))
    + yield();
    +
    + fail_sys:
    + gfs2_sys_fs_del(sdp);
    +
    + fail:
    + vfree(sdp);
    + set_v2sdp(sb, NULL);
    +
    + return error;
    +}
    +
    +/*
    + * gfs2_get_sb - mount entry point for the "gfs2" filesystem type
    + *
    + * Hands the request to get_sb_bdev(), passing fill_super as the callback,
    + * and returns whatever that helper returns.
    + */
    +static struct super_block *gfs2_get_sb(struct file_system_type *fs_type,
    + int flags, const char *dev_name,
    + void *data)
    +{
    + struct super_block *sb;
    +
    + sb = get_sb_bdev(fs_type, flags, dev_name, data, fill_super);
    +
    + return sb;
    +}
    +
    +/* Filesystem type descriptor for "gfs2"; declared extern in ops_fstype.h */
    +struct file_system_type gfs2_fs_type = {
    + .owner = THIS_MODULE,
    + .name = "gfs2",
    + .get_sb = gfs2_get_sb,
    + .kill_sb = kill_block_super,
    + .fs_flags = FS_REQUIRES_DEV,
    +};
    +
    --- a/fs/gfs2/ops_fstype.h 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_fstype.h 2005-10-10 11:28:49.305785544 -0500
    @@ -0,0 +1,15 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#ifndef __OPS_FSTYPE_DOT_H__
    +#define __OPS_FSTYPE_DOT_H__
    +
    +/* The "gfs2" filesystem type descriptor, defined in ops_fstype.c */
    +extern struct file_system_type gfs2_fs_type;
    +
    +#endif /* __OPS_FSTYPE_DOT_H__ */
    --- a/fs/gfs2/ops_inode.c 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_inode.c 2005-10-10 11:28:49.307785232 -0500
    @@ -0,0 +1,1265 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#include <linux/sched.h>
    +#include <linux/slab.h>
    +#include <linux/spinlock.h>
    +#include <linux/completion.h>
    +#include <linux/buffer_head.h>
    +#include <linux/namei.h>
    +#include <linux/utsname.h>
    +#include <linux/mm.h>
    +#include <linux/xattr.h>
    +#include <linux/posix_acl.h>
    +#include <asm/semaphore.h>
    +#include <asm/uaccess.h>
    +
    +#include "gfs2.h"
    +#include "acl.h"
    +#include "bmap.h"
    +#include "dir.h"
    +#include "eaops.h"
    +#include "eattr.h"
    +#include "glock.h"
    +#include "inode.h"
    +#include "meta_io.h"
    +#include "ops_dentry.h"
    +#include "ops_inode.h"
    +#include "page.h"
    +#include "quota.h"
    +#include "rgrp.h"
    +#include "trans.h"
    +#include "unlinked.h"
    +
    +/**
    + * gfs2_create - Create a file
    + * @dir: The directory in which to create the file
    + * @dentry: The dentry of the new file
    + * @mode: The mode of the new file
    + * @nd: lookup intent from the VFS; may be NULL, in which case the
    + *      create is treated as non-exclusive
    + *
    + * If the name already exists and the open is not exclusive, the existing
    + * inode is looked up and attached to @dentry instead.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_create(struct inode *dir, struct dentry *dentry,
    + int mode, struct nameidata *nd)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir), *ip;
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_holder ghs[2];
    + struct inode *inode;
    + /* cleared when an already-existing inode is used instead */
    + int new = 1;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + gfs2_holder_init(dip->i_gl, 0, 0, ghs);
    +
    + /* Retry until either the create or the lookup succeeds; the name
    + can appear or vanish between the two attempts. */
    + for (;;) {
    + error = gfs2_createi(ghs, &dentry->d_name, S_IFREG | mode);
    + if (!error) {
    + ip = get_gl2ip(ghs[1].gh_gl);
    + gfs2_trans_end(sdp);
    + if (dip->i_alloc->al_rgd)
    + gfs2_inplace_release(dip);
    + gfs2_quota_unlock(dip);
    + gfs2_alloc_put(dip);
    + gfs2_glock_dq_uninit_m(2, ghs);
    + break;
    + } else if (error != -EEXIST ||
    + (nd && (nd->intent.open.flags & O_EXCL))) {
    + /* nd is checked first: callers may pass no nameidata */
    + gfs2_holder_uninit(ghs);
    + return error;
    + }
    +
    + error = gfs2_lookupi(dip, &dentry->d_name, 0, &ip);
    + if (!error) {
    + new = 0;
    + gfs2_holder_uninit(ghs);
    + break;
    + } else if (error != -ENOENT) {
    + gfs2_holder_uninit(ghs);
    + return error;
    + }
    + }
    +
    + inode = gfs2_ip2v(ip);
    + gfs2_inode_put(ip);
    +
    + if (!inode)
    + return -ENOMEM;
    +
    + d_instantiate(dentry, inode);
    + if (new)
    + mark_inode_dirty(inode);
    +
    + return 0;
    +}
    +
    +/**
    + * gfs2_lookup - Look up a filename in a directory and return its inode
    + * @dir: The directory inode
    + * @dentry: The dentry of the new inode
    + * @nd: passed from Linux VFS, ignored by us
    + *
    + * Called by the VFS layer. Calls gfs2_lookupi() and attaches the result,
    + * or a negative entry when the name does not exist, to @dentry.
    + *
    + * Returns: the result of d_splice_alias() when an inode was found, NULL
    + * when the name does not exist, or an ERR_PTR() on failure
    + */
    +
    +static struct dentry *gfs2_lookup(struct inode *dir, struct dentry *dentry,
    + struct nameidata *nd)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir);
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_inode *ip;
    + struct inode *inode;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + if (!sdp->sd_args.ar_localcaching)
    + dentry->d_op = &gfs2_dops;
    +
    + error = gfs2_lookupi(dip, &dentry->d_name, 0, &ip);
    + if (error == -ENOENT) {
    + /* no such name: hash a negative dentry */
    + d_add(dentry, NULL);
    + return NULL;
    + }
    + if (error)
    + return ERR_PTR(error);
    +
    + inode = gfs2_ip2v(ip);
    + gfs2_inode_put(ip);
    + if (!inode)
    + return ERR_PTR(-ENOMEM);
    +
    + return d_splice_alias(inode, dentry);
    +}
    +
    +/**
    + * gfs2_link - Link to a file
    + * @old_dentry: The inode to link
    + * @dir: Add link to this directory
    + * @dentry: The name of the link
    + *
    + * Link the inode in "old_dentry" into the directory "dir" with the
    + * name in "dentry".
    + *
    + * Returns: errno; -EPERM for a directory or an immutable/append-only
    + * inode, -EEXIST if the name is already present
    + */
    +
    +static int gfs2_link(struct dentry *old_dentry, struct inode *dir,
    + struct dentry *dentry)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir);
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct inode *inode = old_dentry->d_inode;
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_holder ghs[2];
    + /* only read at labels that are reached after it has been set */
    + int alloc_required;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + if (S_ISDIR(ip->i_di.di_mode))
    + return -EPERM;
    +
    + /* Lock both the directory and the target inode exclusively */
    + gfs2_holder_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
    + gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + 1);
    +
    + error = gfs2_glock_nq_m(2, ghs);
    + if (error)
    + goto out;
    +
    + error = gfs2_repermission(dir, MAY_WRITE | MAY_EXEC, NULL);
    + if (error)
    + goto out_gunlock;
    +
    + /* -ENOENT is the only acceptable outcome: the name must not exist */
    + error = gfs2_dir_search(dip, &dentry->d_name, NULL, NULL);
    + switch (error) {
    + case -ENOENT:
    + break;
    + case 0:
    + error = -EEXIST;
    + /* fall through */
    + default:
    + goto out_gunlock;
    + }
    +
    + /* Each check presets the error it reports before testing */
    + error = -EINVAL;
    + if (!dip->i_di.di_nlink)
    + goto out_gunlock;
    + error = -EFBIG;
    + if (dip->i_di.di_entries == (uint32_t)-1)
    + goto out_gunlock;
    + error = -EPERM;
    + if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
    + goto out_gunlock;
    + error = -EINVAL;
    + if (!ip->i_di.di_nlink)
    + goto out_gunlock;
    + error = -EMLINK;
    + if (ip->i_di.di_nlink == (uint32_t)-1)
    + goto out_gunlock;
    +
    + error = gfs2_diradd_alloc_required(dip, &dentry->d_name,
    + &alloc_required);
    + if (error)
    + goto out_gunlock;
    +
    + if (alloc_required) {
    + struct gfs2_alloc *al = gfs2_alloc_get(dip);
    +
    + error = gfs2_quota_lock(dip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE);
    + if (error)
    + goto out_alloc;
    +
    + error = gfs2_quota_check(dip, dip->i_di.di_uid,
    + dip->i_di.di_gid);
    + if (error)
    + goto out_gunlock_q;
    +
    + al->al_requested = sdp->sd_max_dirres;
    +
    + error = gfs2_inplace_reserve(dip);
    + if (error)
    + goto out_gunlock_q;
    +
    + error = gfs2_trans_begin(sdp,
    + sdp->sd_max_dirres +
    + al->al_rgd->rd_ri.ri_length +
    + 2 * RES_DINODE + RES_STATFS +
    + RES_QUOTA, 0);
    + if (error)
    + goto out_ipres;
    + } else {
    + error = gfs2_trans_begin(sdp, 2 * RES_DINODE + RES_LEAF, 0);
    + if (error)
    + goto out_ipres;
    + }
    +
    + error = gfs2_dir_add(dip, &dentry->d_name, &ip->i_num,
    + IF2DT(ip->i_di.di_mode));
    + if (error)
    + goto out_end_trans;
    +
    + error = gfs2_change_nlink(ip, +1);
    +
    + /* Cleanup ladder, also taken on success; the allocation-related
    + steps only run when an allocation was set up above */
    +
    + out_end_trans:
    + gfs2_trans_end(sdp);
    +
    + out_ipres:
    + if (alloc_required)
    + gfs2_inplace_release(dip);
    +
    + out_gunlock_q:
    + if (alloc_required)
    + gfs2_quota_unlock(dip);
    +
    + out_alloc:
    + if (alloc_required)
    + gfs2_alloc_put(dip);
    +
    + out_gunlock:
    + gfs2_glock_dq_m(2, ghs);
    +
    + out:
    + gfs2_holder_uninit(ghs);
    + gfs2_holder_uninit(ghs + 1);
    +
    + if (!error) {
    + /* the new dentry takes its own reference on the inode */
    + atomic_inc(&inode->i_count);
    + d_instantiate(dentry, inode);
    + mark_inode_dirty(inode);
    + }
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_unlink - Unlink a file
    + * @dir: The inode of the directory containing the file to unlink
    + * @dentry: The file itself
    + *
    + * Unlink a file. Call gfs2_unlinki()
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_unlink(struct inode *dir, struct dentry *dentry)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir);
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    + struct gfs2_unlinked *ul;
    + struct gfs2_holder ghs[2];
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + /* Obtained before any glock is taken; released on every exit path
    + below via gfs2_unlinked_put() */
    + error = gfs2_unlinked_get(sdp, &ul);
    + if (error)
    + return error;
    +
    + /* Lock both the directory and the victim inode exclusively */
    + gfs2_holder_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
    + gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + 1);
    +
    + error = gfs2_glock_nq_m(2, ghs);
    + if (error)
    + goto out;
    +
    + error = gfs2_unlink_ok(dip, &dentry->d_name, ip);
    + if (error)
    + goto out_gunlock;
    +
    + error = gfs2_trans_begin(sdp, 2 * RES_DINODE + RES_LEAF +
    + RES_UNLINKED, 0);
    + if (error)
    + goto out_gunlock;
    +
    + /* The transaction is ended whether or not the unlink succeeded */
    + error = gfs2_unlinki(dip, &dentry->d_name, ip,ul);
    +
    + gfs2_trans_end(sdp);
    +
    + out_gunlock:
    + gfs2_glock_dq_m(2, ghs);
    +
    + out:
    + gfs2_holder_uninit(ghs);
    + gfs2_holder_uninit(ghs + 1);
    +
    + gfs2_unlinked_put(sdp, ul);
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_symlink - Create a symlink
    + * @dir: The directory to create the symlink in
    + * @dentry: The dentry to put the symlink in
    + * @symname: The thing which the link points to
    + *
    + * The target string is stored in the dinode block directly after the
    + * on-disk dinode structure.
    + *
    + * Returns: errno; -ENAMETOOLONG if @symname does not fit in that space
    + */
    +
    +static int gfs2_symlink(struct inode *dir, struct dentry *dentry,
    + const char *symname)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir), *ip;
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_holder ghs[2];
    + struct inode *inode;
    + struct buffer_head *dibh;
    + int size;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + /* Must be stuffed with a null terminator for gfs2_follow_link() */
    + size = strlen(symname);
    + if (size > sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode) - 1)
    + return -ENAMETOOLONG;
    +
    + gfs2_holder_init(dip->i_gl, 0, 0, ghs);
    +
    + error = gfs2_createi(ghs, &dentry->d_name, S_IFLNK | S_IRWXUGO);
    + if (error) {
    + gfs2_holder_uninit(ghs);
    + return error;
    + }
    +
    + /* NOTE(review): on success gfs2_createi() appears to return with a
    + transaction open, quota locked and an allocation held on dip -
    + the matching release calls are made below; confirm in inode.c */
    + ip = get_gl2ip(ghs[1].gh_gl);
    +
    + ip->i_di.di_size = size;
    +
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    +
    + if (!gfs2_assert_withdraw(sdp, !error)) {
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + /* only the size bytes of the target are copied, no terminator */
    + memcpy(dibh->b_data + sizeof(struct gfs2_dinode), symname,
    + size);
    + brelse(dibh);
    + }
    +
    + gfs2_trans_end(sdp);
    + if (dip->i_alloc->al_rgd)
    + gfs2_inplace_release(dip);
    + gfs2_quota_unlock(dip);
    + gfs2_alloc_put(dip);
    +
    + gfs2_glock_dq_uninit_m(2, ghs);
    +
    + inode = gfs2_ip2v(ip);
    + gfs2_inode_put(ip);
    +
    + if (!inode)
    + return -ENOMEM;
    +
    + d_instantiate(dentry, inode);
    + mark_inode_dirty(inode);
    +
    + return 0;
    +}
    +
    +/**
    + * gfs2_mkdir - Make a directory
    + * @dir: The parent directory of the new one
    + * @dentry: The dentry of the new directory
    + * @mode: The mode of the new directory
    + *
    + * Creates the inode, writes the "." and ".." entries into its dinode
    + * block and bumps the parent's link count.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_mkdir(struct inode *dir, struct dentry *dentry, int mode)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir), *ip;
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_holder ghs[2];
    + struct inode *inode;
    + struct buffer_head *dibh;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + gfs2_holder_init(dip->i_gl, 0, 0, ghs);
    +
    + error = gfs2_createi(ghs, &dentry->d_name, S_IFDIR | mode);
    + if (error) {
    + gfs2_holder_uninit(ghs);
    + return error;
    + }
    +
    + /* NOTE(review): on success gfs2_createi() appears to return with a
    + transaction open, quota locked and an allocation held on dip -
    + the matching release calls are made below; confirm in inode.c */
    + ip = get_gl2ip(ghs[1].gh_gl);
    +
    + /* A new directory starts with two links and two entries */
    + ip->i_di.di_nlink = 2;
    + ip->i_di.di_size = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode);
    + ip->i_di.di_flags |= GFS2_DIF_JDATA;
    + ip->i_di.di_payload_format = GFS2_FORMAT_DE;
    + ip->i_di.di_entries = 2;
    +
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    +
    + if (!gfs2_assert_withdraw(sdp, !error)) {
    + struct gfs2_dinode *di = (struct gfs2_dinode *)dibh->b_data;
    + struct gfs2_dirent *dent;
    +
    + /* "." entry: refers to the new directory itself */
    + gfs2_dirent_alloc(ip, dibh, 1, &dent);
    +
    + dent->de_inum = di->di_num; /* already GFS2 endian */
    + dent->de_hash = gfs2_disk_hash(".", 1);
    + dent->de_hash = cpu_to_le32(dent->de_hash);
    + dent->de_type = DT_DIR;
    + memcpy((char *) (dent + 1), ".", 1);
    + di->di_entries = cpu_to_le32(1);
    +
    + /* ".." entry: refers to the parent directory */
    + gfs2_dirent_alloc(ip, dibh, 2, &dent);
    +
    + gfs2_inum_out(&dip->i_num, (char *) &dent->de_inum);
    + dent->de_hash = gfs2_disk_hash("..", 2);
    + dent->de_hash = cpu_to_le32(dent->de_hash);
    + dent->de_type = DT_DIR;
    + memcpy((char *) (dent + 1), "..", 2);
    +
    + /* writes the in-core dinode (di_entries == 2) over the buffer */
    + gfs2_dinode_out(&ip->i_di, (char *)di);
    +
    + brelse(dibh);
    + }
    +
    + error = gfs2_change_nlink(dip, +1);
    + gfs2_assert_withdraw(sdp, !error); /* dip already pinned */
    +
    + gfs2_trans_end(sdp);
    + if (dip->i_alloc->al_rgd)
    + gfs2_inplace_release(dip);
    + gfs2_quota_unlock(dip);
    + gfs2_alloc_put(dip);
    +
    + gfs2_glock_dq_uninit_m(2, ghs);
    +
    + inode = gfs2_ip2v(ip);
    + gfs2_inode_put(ip);
    +
    + if (!inode)
    + return -ENOMEM;
    +
    + d_instantiate(dentry, inode);
    + mark_inode_dirty(inode);
    +
    + return 0;
    +}
    +
    +/**
    + * gfs2_rmdir - Remove a directory
    + * @dir: The parent directory of the directory to be removed
    + * @dentry: The dentry of the directory to remove
    + *
    + * Remove a directory. Call gfs2_rmdiri()
    + *
    + * Returns: errno; -ENOTEMPTY if the directory holds more than two
    + * entries, -EIO if it holds fewer than two
    + */
    +
    +static int gfs2_rmdir(struct inode *dir, struct dentry *dentry)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir);
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    + struct gfs2_unlinked *ul;
    + struct gfs2_holder ghs[2];
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + /* Obtained before any glock is taken; released on every exit path
    + below via gfs2_unlinked_put() */
    + error = gfs2_unlinked_get(sdp, &ul);
    + if (error)
    + return error;
    +
    + /* Lock both the parent and the victim directory exclusively */
    + gfs2_holder_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
    + gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + 1);
    +
    + error = gfs2_glock_nq_m(2, ghs);
    + if (error)
    + goto out;
    +
    + error = gfs2_unlink_ok(dip, &dentry->d_name, ip);
    + if (error)
    + goto out_gunlock;
    +
    + /* Fewer than two entries is treated as an inconsistency */
    + if (ip->i_di.di_entries < 2) {
    + if (gfs2_consist_inode(ip))
    + gfs2_dinode_print(&ip->i_di);
    + error = -EIO;
    + goto out_gunlock;
    + }
    + if (ip->i_di.di_entries > 2) {
    + error = -ENOTEMPTY;
    + goto out_gunlock;
    + }
    +
    + error = gfs2_trans_begin(sdp, 2 * RES_DINODE + 3 * RES_LEAF +
    + RES_UNLINKED, 0);
    + if (error)
    + goto out_gunlock;
    +
    + /* The transaction is ended whether or not the removal succeeded */
    + error = gfs2_rmdiri(dip, &dentry->d_name, ip, ul);
    +
    + gfs2_trans_end(sdp);
    +
    + out_gunlock:
    + gfs2_glock_dq_m(2, ghs);
    +
    + out:
    + gfs2_holder_uninit(ghs);
    + gfs2_holder_uninit(ghs + 1);
    +
    + gfs2_unlinked_put(sdp, ul);
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_mknod - Make a special file
    + * @dir: The directory in which the special file will reside
    + * @dentry: The dentry of the special file
    + * @mode: The mode of the special file
    + * @dev: The device specification of the special file
    + *
    + * Returns: errno; -EOPNOTSUPP if @mode is not a block device, character
    + * device, FIFO or socket
    + */
    +
    +static int gfs2_mknod(struct inode *dir, struct dentry *dentry, int mode,
    + dev_t dev)
    +{
    + struct gfs2_inode *dip = get_v2ip(dir), *ip;
    + struct gfs2_sbd *sdp = dip->i_sbd;
    + struct gfs2_holder ghs[2];
    + struct inode *inode;
    + struct buffer_head *dibh;
    + uint32_t major = 0, minor = 0;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + /* Only device nodes carry major/minor; FIFOs and sockets keep 0 */
    + switch (mode & S_IFMT) {
    + case S_IFBLK:
    + case S_IFCHR:
    + major = MAJOR(dev);
    + minor = MINOR(dev);
    + break;
    + case S_IFIFO:
    + case S_IFSOCK:
    + break;
    + default:
    + return -EOPNOTSUPP;
    + };
    +
    + gfs2_holder_init(dip->i_gl, 0, 0, ghs);
    +
    + error = gfs2_createi(ghs, &dentry->d_name, mode);
    + if (error) {
    + gfs2_holder_uninit(ghs);
    + return error;
    + }
    +
    + /* NOTE(review): on success gfs2_createi() appears to return with a
    + transaction open, quota locked and an allocation held on dip -
    + the matching release calls are made below; confirm in inode.c */
    + ip = get_gl2ip(ghs[1].gh_gl);
    +
    + ip->i_di.di_major = major;
    + ip->i_di.di_minor = minor;
    +
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    +
    + if (!gfs2_assert_withdraw(sdp, !error)) {
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    + }
    +
    + gfs2_trans_end(sdp);
    + if (dip->i_alloc->al_rgd)
    + gfs2_inplace_release(dip);
    + gfs2_quota_unlock(dip);
    + gfs2_alloc_put(dip);
    +
    + gfs2_glock_dq_uninit_m(2, ghs);
    +
    + inode = gfs2_ip2v(ip);
    + gfs2_inode_put(ip);
    +
    + if (!inode)
    + return -ENOMEM;
    +
    + d_instantiate(dentry, inode);
    + mark_inode_dirty(inode);
    +
    + return 0;
    +}
    +
    +/**
    + * gfs2_rename - Rename a file
    + * @odir: Parent directory of old file name
    + * @odentry: The old dentry of the file
    + * @ndir: Parent directory of new file name
    + * @ndentry: The new dentry of the file
    + *
    + * Renaming an inode onto itself returns 0 without doing anything. If
    + * @ndentry already has an inode, that target is removed in the same
    + * transaction (gfs2_rmdiri() for a directory, which must hold exactly two
    + * entries, gfs2_unlinki() otherwise). Moving a directory to a different
    + * parent additionally takes sd_rename_gl exclusively, checks
    + * gfs2_ok_to_move(), adjusts both parents' link counts and repoints the
    + * directory's ".." entry at the new parent.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_rename(struct inode *odir, struct dentry *odentry,
    + struct inode *ndir, struct dentry *ndentry)
    +{
    + struct gfs2_inode *odip = get_v2ip(odir);
    + struct gfs2_inode *ndip = get_v2ip(ndir);
    + struct gfs2_inode *ip = get_v2ip(odentry->d_inode);
    + struct gfs2_inode *nip = NULL;
    + struct gfs2_sbd *sdp = odip->i_sbd;
    + struct gfs2_unlinked *ul;
    + struct gfs2_holder ghs[4], r_gh;
    + unsigned int num_gh;
    + int dir_rename = 0;
    + int alloc_required;
    + unsigned int x;
    + int error;
    +
    + atomic_inc(&sdp->sd_ops_inode);
    +
    + if (ndentry->d_inode) {
    + nip = get_v2ip(ndentry->d_inode);
    + if (ip == nip)
    + return 0; /* old and new names refer to the same inode */
    + }
    +
    + error = gfs2_unlinked_get(sdp, &ul);
    + if (error)
    + return error;
    +
    + /* Make sure we aren't trying to move a directory into its subdir */
    +
    + if (S_ISDIR(ip->i_di.di_mode) && odip != ndip) {
    + dir_rename = 1;
    +
    + error = gfs2_glock_nq_init(sdp->sd_rename_gl,
    + LM_ST_EXCLUSIVE, 0,
    + &r_gh);
    + if (error)
    + goto out;
    +
    + error = gfs2_ok_to_move(ip, ndip);
    + if (error)
    + goto out_gunlock_r;
    + }
    +
    + gfs2_holder_init(odip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
    + gfs2_holder_init(ndip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + 1);
    + gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + 2);
    + num_gh = 3;
    +
    + if (nip) /* an existing target gets a fourth holder */
    + gfs2_holder_init(nip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + num_gh++);
    +
    + error = gfs2_glock_nq_m(num_gh, ghs);
    + if (error)
    + goto out_uninit;
    +
    + /* Check out the old directory */
    +
    + error = gfs2_unlink_ok(odip, &odentry->d_name, ip);
    + if (error)
    + goto out_gunlock;
    +
    + /* Check out the new directory */
    +
    + if (nip) {
    + error = gfs2_unlink_ok(ndip, &ndentry->d_name, nip);
    + if (error)
    + goto out_gunlock;
    +
    + if (S_ISDIR(nip->i_di.di_mode)) {
    + if (nip->i_di.di_entries < 2) { /* fewer than two entries is reported as an inconsistency */
    + if (gfs2_consist_inode(nip))
    + gfs2_dinode_print(&nip->i_di);
    + error = -EIO;
    + goto out_gunlock;
    + }
    + if (nip->i_di.di_entries > 2) {
    + error = -ENOTEMPTY;
    + goto out_gunlock;
    + }
    + }
    + } else {
    + error = gfs2_repermission(ndir, MAY_WRITE | MAY_EXEC, NULL);
    + if (error)
    + goto out_gunlock;
    +
    + error = gfs2_dir_search(ndip, &ndentry->d_name, NULL, NULL);
    + switch (error) {
    + case -ENOENT: /* name is free in the new directory */
    + error = 0;
    + break;
    + case 0:
    + error = -EEXIST; /* fall through */
    + default:
    + goto out_gunlock;
    + };
    +
    + if (odip != ndip) {
    + if (!ndip->i_di.di_nlink) {
    + error = -EINVAL;
    + goto out_gunlock;
    + }
    + if (ndip->i_di.di_entries == (uint32_t)-1) {
    + error = -EFBIG;
    + goto out_gunlock;
    + }
    + if (S_ISDIR(ip->i_di.di_mode) &&
    + ndip->i_di.di_nlink == (uint32_t)-1) {
    + error = -EMLINK;
    + goto out_gunlock;
    + }
    + }
    + }
    +
    + /* Check out the dir to be renamed */
    +
    + if (dir_rename) {
    + error = gfs2_repermission(odentry->d_inode, MAY_WRITE, NULL);
    + if (error)
    + goto out_gunlock;
    + }
    +
    + error = gfs2_diradd_alloc_required(ndip, &ndentry->d_name,
    + &alloc_required);
    + if (error)
    + goto out_gunlock;
    +
    + if (alloc_required) {
    + struct gfs2_alloc *al = gfs2_alloc_get(ndip);
    +
    + error = gfs2_quota_lock(ndip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE);
    + if (error)
    + goto out_alloc;
    +
    + error = gfs2_quota_check(ndip, ndip->i_di.di_uid,
    + ndip->i_di.di_gid);
    + if (error)
    + goto out_gunlock_q;
    +
    + al->al_requested = sdp->sd_max_dirres;
    +
    + error = gfs2_inplace_reserve(ndip);
    + if (error)
    + goto out_gunlock_q;
    +
    + error = gfs2_trans_begin(sdp,
    + sdp->sd_max_dirres +
    + al->al_rgd->rd_ri.ri_length +
    + 4 * RES_DINODE + 4 * RES_LEAF +
    + RES_UNLINKED + RES_STATFS +
    + RES_QUOTA, 0);
    + if (error)
    + goto out_ipreserv;
    + } else {
    + error = gfs2_trans_begin(sdp, 4 * RES_DINODE +
    + 5 * RES_LEAF +
    + RES_UNLINKED, 0);
    + if (error)
    + goto out_gunlock;
    + }
    +
    + /* Remove the target file, if it exists */
    +
    + if (nip) {
    + if (S_ISDIR(nip->i_di.di_mode))
    + error = gfs2_rmdiri(ndip, &ndentry->d_name, nip, ul);
    + else
    + error = gfs2_unlinki(ndip, &ndentry->d_name, nip, ul);
    + if (error)
    + goto out_end_trans;
    + }
    +
    + if (dir_rename) {
    + struct qstr name;
    + name.len = 2;
    + name.name = "..";
    +
    + error = gfs2_change_nlink(ndip, +1);
    + if (error)
    + goto out_end_trans;
    + error = gfs2_change_nlink(odip, -1);
    + if (error)
    + goto out_end_trans;
    +
    + error = gfs2_dir_mvino(ip, &name, &ndip->i_num, DT_DIR); /* repoint ".." at the new parent */
    + if (error)
    + goto out_end_trans;
    + } else {
    + struct buffer_head *dibh;
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    + if (error)
    + goto out_end_trans;
    + ip->i_di.di_ctime = get_seconds();
    + gfs2_trans_add_bh(ip->i_gl, dibh);
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    + }
    +
    + error = gfs2_dir_del(odip, &odentry->d_name);
    + if (error)
    + goto out_end_trans;
    +
    + error = gfs2_dir_add(ndip, &ndentry->d_name, &ip->i_num,
    + IF2DT(ip->i_di.di_mode));
    + if (error)
    + goto out_end_trans;
    +
    + out_end_trans:
    + gfs2_trans_end(sdp);
    +
    + out_ipreserv:
    + if (alloc_required)
    + gfs2_inplace_release(ndip);
    +
    + out_gunlock_q:
    + if (alloc_required)
    + gfs2_quota_unlock(ndip);
    +
    + out_alloc:
    + if (alloc_required)
    + gfs2_alloc_put(ndip);
    +
    + out_gunlock:
    + gfs2_glock_dq_m(num_gh, ghs);
    +
    + out_uninit:
    + for (x = 0; x < num_gh; x++)
    + gfs2_holder_uninit(ghs + x);
    +
    + out_gunlock_r:
    + if (dir_rename) /* sd_rename_gl was only taken for a cross-directory directory move */
    + gfs2_glock_dq_uninit(&r_gh);
    +
    + out:
    + gfs2_unlinked_put(sdp, ul);
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_readlink - Copy the target of a symlink to user space
    + * @dentry: the symlink
    + * @user_buf: the user-space buffer that receives the link target
    + * @user_size: the size of @user_buf
    + *
    + * The target is fetched with gfs2_readlinki(), starting from an on-stack
    + * buffer of GFS2_FAST_NAME_SIZE bytes. At most (returned length - 1) bytes
    + * are copied out.
    + *
    + * Returns: the number of bytes copied, or a negative errno (-EFAULT when
    + * the copy to user space fails)
    + */
    +
    +static int gfs2_readlink(struct dentry *dentry, char __user *user_buf,
    + int user_size)
    +{
    + struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    + char fast_buf[GFS2_FAST_NAME_SIZE];
    + char *target = fast_buf;
    + unsigned int target_len = GFS2_FAST_NAME_SIZE;
    + int ret;
    +
    + atomic_inc(&ip->i_sbd->sd_ops_inode);
    +
    + ret = gfs2_readlinki(ip, &target, &target_len);
    + if (ret)
    +     return ret;
    +
    + /* Clamp the request to one byte less than the reported length. */
    + if (user_size > target_len - 1)
    +     user_size = target_len - 1;
    +
    + ret = copy_to_user(user_buf, target, user_size) ? -EFAULT : user_size;
    +
    + /* A buffer other than the on-stack one has to be freed here. */
    + if (target != fast_buf)
    +     kfree(target);
    +
    + return ret;
    +}
    +
    +/**
    + * gfs2_follow_link - Follow a symbolic link
    + * @dentry: The dentry of the link
    + * @nd: Data that we pass to vfs_follow_link()
    + *
    + * Works for symlinks of any size; targets that fit in GFS2_FAST_NAME_SIZE
    + * bytes are read into an on-stack buffer.
    + *
    + * Returns: ERR_PTR() of 0 on success or of the error code
    + */
    +
    +static void *gfs2_follow_link(struct dentry *dentry, struct nameidata *nd)
    +{
    + struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    + char fast_buf[GFS2_FAST_NAME_SIZE];
    + char *target = fast_buf;
    + unsigned int target_len = GFS2_FAST_NAME_SIZE;
    + int ret;
    +
    + atomic_inc(&ip->i_sbd->sd_ops_inode);
    +
    + ret = gfs2_readlinki(ip, &target, &target_len);
    + if (ret)
    +     return ERR_PTR(ret);
    +
    + ret = vfs_follow_link(nd, target);
    +
    + /* A buffer other than the on-stack one has to be freed here. */
    + if (target != fast_buf)
    +     kfree(target);
    +
    + return ERR_PTR(ret);
    +}
    +
    +/**
    + * gfs2_permission - Check access permissions on an inode
    + * @inode: the inode to check
    + * @mask: the access mask handed to generic_permission()
    + * @nd: passed from Linux VFS, ignored by us
    + *
    + * If the inode's i_vn equals its glock's gl_vn, the check runs straight
    + * away with gfs2_check_acl as the ACL callback. Otherwise the inode glock
    + * is acquired shared around a check that uses gfs2_check_acl_locked.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_permission(struct inode *inode, int mask, struct nameidata *nd)
    +{
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_holder i_gh;
    + int ret;
    +
    + atomic_inc(&ip->i_sbd->sd_ops_inode);
    +
    + if (ip->i_vn == ip->i_gl->gl_vn)
    +     return generic_permission(inode, mask, gfs2_check_acl);
    +
    + ret = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &i_gh);
    + if (ret)
    +     return ret;
    +
    + ret = generic_permission(inode, mask, gfs2_check_acl_locked);
    + gfs2_glock_dq_uninit(&i_gh);
    +
    + return ret;
    +}
    +
    +/**
    + * setattr_size - Apply a size change to an inode
    + * @inode: the inode being resized
    + * @attr: the attribute change; only ia_size is read here
    + *
    + * vmtruncate() is called only when the requested size differs from the
    + * size recorded in the dinode; gfs2_truncatei() is called in either case.
    + *
    + * Returns: errno
    + */
    +
    +static int setattr_size(struct inode *inode, struct iattr *attr)
    +{
    + struct gfs2_inode *ip = get_v2ip(inode);
    +
    + if (attr->ia_size != ip->i_di.di_size) {
    +     int error = vmtruncate(inode, attr->ia_size);
    +
    +     if (error)
    +         return error;
    + }
    +
    + return gfs2_truncatei(ip, attr->ia_size, gfs2_truncator_page);
    +}
    +
    +/**
    + * setattr_chown - Change the owner and/or group of an inode
    + * @inode: the inode being changed
    + * @attr: the attribute change
    + *
    + * An id that is not being changed (flag not set in ia_valid, or new value
    + * equal to the old one) is replaced by NO_QUOTA_CHANGE on both the old and
    + * the new side. When at least one id really changes, the new ids are
    + * quota-checked and the inode's block count is moved from the old ids to
    + * the new ones.
    + *
    + * Returns: errno
    + */
    +
    +static int setattr_chown(struct inode *inode, struct iattr *attr)
    +{
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_sbd *sdp = ip->i_sbd;
    + struct buffer_head *dibh;
    + uint32_t old_uid = ip->i_di.di_uid;
    + uint32_t old_gid = ip->i_di.di_gid;
    + uint32_t new_uid = attr->ia_uid;
    + uint32_t new_gid = attr->ia_gid;
    + int quota_moves;
    + int error;
    +
    + if (!(attr->ia_valid & ATTR_UID) || old_uid == new_uid)
    +     old_uid = new_uid = NO_QUOTA_CHANGE;
    + if (!(attr->ia_valid & ATTR_GID) || old_gid == new_gid)
    +     old_gid = new_gid = NO_QUOTA_CHANGE;
    +
    + /* True when the uid or the gid (or both) really changes. */
    + quota_moves = (old_uid != NO_QUOTA_CHANGE || old_gid != NO_QUOTA_CHANGE);
    +
    + gfs2_alloc_get(ip);
    +
    + error = gfs2_quota_lock(ip, new_uid, new_gid);
    + if (error)
    +     goto out_alloc;
    +
    + if (quota_moves) {
    +     error = gfs2_quota_check(ip, new_uid, new_gid);
    +     if (error)
    +         goto out_gunlock_q;
    + }
    +
    + error = gfs2_trans_begin(sdp, RES_DINODE + 2 * RES_QUOTA, 0);
    + if (error)
    +     goto out_gunlock_q;
    +
    + error = gfs2_meta_inode_buffer(ip, &dibh);
    + if (error)
    +     goto out_end_trans;
    +
    + /* A failure here is only warned about; processing continues. */
    + error = inode_setattr(inode, attr);
    + gfs2_assert_warn(sdp, !error);
    + gfs2_inode_attr_out(ip);
    +
    + gfs2_trans_add_bh(ip->i_gl, dibh);
    + gfs2_dinode_out(&ip->i_di, dibh->b_data);
    + brelse(dibh);
    +
    + if (quota_moves) {
    +     gfs2_quota_change(ip, -ip->i_di.di_blocks, old_uid, old_gid);
    +     gfs2_quota_change(ip, ip->i_di.di_blocks, new_uid, new_gid);
    + }
    +
    + out_end_trans:
    + gfs2_trans_end(sdp);
    +
    + out_gunlock_q:
    + gfs2_quota_unlock(ip);
    +
    + out_alloc:
    + gfs2_alloc_put(ip);
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_setattr - Change attributes on an inode
    + * @dentry: The dentry which is changing
    + * @attr: The structure describing the change
    + *
    + * Runs with the inode glock held exclusively. Immutable and append-only
    + * inodes are refused with -EPERM. Exactly one handler is chosen, in this
    + * order: size change, uid/gid change, mode change on a POSIX-ACL inode,
    + * and finally gfs2_setattr_simple() for everything else. The inode is
    + * marked dirty when the change succeeds.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_setattr(struct dentry *dentry, struct iattr *attr)
    +{
    + struct inode *inode = dentry->d_inode;
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_holder i_gh;
    + int error;
    +
    + atomic_inc(&ip->i_sbd->sd_ops_inode);
    +
    + error = gfs2_glock_nq_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, &i_gh);
    + if (error)
    +     return error;
    +
    + if (IS_IMMUTABLE(inode) || IS_APPEND(inode)) {
    +     error = -EPERM;
    +     goto out;
    + }
    +
    + error = inode_change_ok(inode, attr);
    + if (error)
    +     goto out;
    +
    + if (attr->ia_valid & ATTR_SIZE) {
    +     error = setattr_size(inode, attr);
    + } else if (attr->ia_valid & (ATTR_UID | ATTR_GID)) {
    +     error = setattr_chown(inode, attr);
    + } else if ((attr->ia_valid & ATTR_MODE) && IS_POSIXACL(inode)) {
    +     error = gfs2_acl_chmod(ip, attr);
    + } else {
    +     error = gfs2_setattr_simple(ip, attr);
    + }
    +
    + out:
    + gfs2_glock_dq_uninit(&i_gh);
    +
    + if (!error)
    +     mark_inode_dirty(inode);
    +
    + return error;
    +}
    +
    +/**
    + * gfs2_getattr - Read out an inode's attributes
    + * @mnt: the mount; not used by this function
    + * @dentry: The dentry to stat
    + * @stat: The inode's stats
    + *
    + * generic_fillattr() is called with the inode glock held shared.
    + *
    + * Returns: errno
    + */
    +
    +static int gfs2_getattr(struct vfsmount *mnt, struct dentry *dentry,
    + struct kstat *stat)
    +{
    + struct inode *inode = dentry->d_inode;
    + struct gfs2_inode *ip = get_v2ip(inode);
    + struct gfs2_holder gh;
    + int error;
    +
    + atomic_inc(&ip->i_sbd->sd_ops_inode);
    +
    + error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &gh);
    + if (error)
    +     return error;
    +
    + generic_fillattr(inode, stat);
    + gfs2_glock_dq_uninit(&gh);
    +
    + return 0;
    +}
    +
    +/**
    + * gfs2_setxattr - Set an extended attribute
    + * @dentry: the dentry whose inode gets the attribute
    + * @name: the full attribute name; gfs2_ea_name2type() derives the type and
    + *        the name stored in the request from it
    + * @data: the attribute value
    + * @size: the length of @data
    + * @flags: stored in the request's er_flags
    + *
    + * Returns: -EOPNOTSUPP if the name maps to GFS2_EATYPE_UNUSED, otherwise
    + * the result of gfs2_ea_set()
    + */
    +
    +static int gfs2_setxattr(struct dentry *dentry, const char *name,
    + const void *data, size_t size, int flags)
    +{
    + struct gfs2_inode *ip = get_v2ip(dentry->d_inode);
    + struct gfs2_ea_request er;
    +
    + atomic_inc(&ip->i_sbd->sd_ops_inode);
    +
    + memset(&er, 0, sizeof(er));
    +
    + er.er_type = gfs2_ea_name2type(name, &er.er_name);
    + if (er.er_type == GFS2_EATYPE_UNUSED)
    +     return -EOPNOTSUPP;
    +
    + er.er_name_len = strlen(er.er_name);
    + er.er_data = (char *)data;
    + er.er_data_len = size;
    + er.er_flags = flags;
    +
    + gfs2_assert_warn(ip->i_sbd, !(er.er_flags & GFS2_ERF_MODE));
    +
    + return gfs2_ea_set(ip, &er);
    +}
    +
    +/**
    + * gfs2_getxattr - Read an extended attribute
    + * @dentry: the dentry whose inode is queried
    + * @name: the full attribute name; gfs2_ea_name2type() derives the type and
    + *        the name stored in the request from it
    + * @data: the buffer for the attribute value
    + * @size: the size of @data
    + *
    + * Returns: -EOPNOTSUPP if the name maps to GFS2_EATYPE_UNUSED, otherwise
    + * the result of gfs2_ea_get()
    + */
    +
    +static ssize_t gfs2_getxattr(struct dentry *dentry, const char *name,
    + void *data, size_t size)
    +{
    + struct inode *inode = dentry->d_inode;
    + struct gfs2_ea_request er;
    +
    + atomic_inc(&get_v2sdp(inode->i_sb)->sd_ops_inode);
    +
    + memset(&er, 0, sizeof(er));
    +
    + er.er_type = gfs2_ea_name2type(name, &er.er_name);
    + if (er.er_type == GFS2_EATYPE_UNUSED)
    +     return -EOPNOTSUPP;
    +
    + er.er_name_len = strlen(er.er_name);
    + er.er_data = data;
    + er.er_data_len = size;
    +
    + return gfs2_ea_get(get_v2ip(inode), &er);
    +}
    +
    +/**
    + * gfs2_listxattr - List the extended attributes of an inode
    + * @dentry: the dentry whose inode is queried
    + * @buffer: the buffer for the list; not passed on when @size is zero
    + * @size: the size of @buffer
    + *
    + * Returns: the result of gfs2_ea_list()
    + */
    +
    +static ssize_t gfs2_listxattr(struct dentry *dentry, char *buffer, size_t size)
    +{
    + struct inode *inode = dentry->d_inode;
    + struct gfs2_ea_request er;
    +
    + atomic_inc(&get_v2sdp(inode->i_sb)->sd_ops_inode);
    +
    + memset(&er, 0, sizeof(er));
    + er.er_data_len = size;
    + er.er_data = size ? buffer : NULL;
    +
    + return gfs2_ea_list(get_v2ip(inode), &er);
    +}
    +
    +/**
    + * gfs2_removexattr - Remove an extended attribute
    + * @dentry: the dentry whose inode loses the attribute
    + * @name: the full attribute name; gfs2_ea_name2type() derives the type and
    + *        the name stored in the request from it
    + *
    + * Returns: -EOPNOTSUPP if the name maps to GFS2_EATYPE_UNUSED, otherwise
    + * the result of gfs2_ea_remove()
    + */
    +
    +static int gfs2_removexattr(struct dentry *dentry, const char *name)
    +{
    + struct inode *inode = dentry->d_inode;
    + struct gfs2_ea_request er;
    +
    + atomic_inc(&get_v2sdp(inode->i_sb)->sd_ops_inode);
    +
    + memset(&er, 0, sizeof(er));
    +
    + er.er_type = gfs2_ea_name2type(name, &er.er_name);
    + if (er.er_type == GFS2_EATYPE_UNUSED)
    +     return -EOPNOTSUPP;
    +
    + er.er_name_len = strlen(er.er_name);
    +
    + return gfs2_ea_remove(get_v2ip(inode), &er);
    +}
    +
    +/*
    + * gfs2_file_iops - permission, attribute and extended-attribute operations
    + * only; initialised identically to gfs2_dev_iops.
    + */
    +struct inode_operations gfs2_file_iops = {
    + .getattr     = gfs2_getattr,
    + .setattr     = gfs2_setattr,
    + .permission  = gfs2_permission,
    + .getxattr    = gfs2_getxattr,
    + .setxattr    = gfs2_setxattr,
    + .listxattr   = gfs2_listxattr,
    + .removexattr = gfs2_removexattr,
    +};
    +
    +/*
    + * gfs2_dev_iops - permission, attribute and extended-attribute operations
    + * only; initialised identically to gfs2_file_iops.
    + */
    +struct inode_operations gfs2_dev_iops = {
    + .getattr     = gfs2_getattr,
    + .setattr     = gfs2_setattr,
    + .permission  = gfs2_permission,
    + .getxattr    = gfs2_getxattr,
    + .setxattr    = gfs2_setxattr,
    + .listxattr   = gfs2_listxattr,
    + .removexattr = gfs2_removexattr,
    +};
    +
    +/*
    + * gfs2_dir_iops - the namespace operations (create, lookup, link, unlink,
    + * symlink, mkdir, rmdir, mknod, rename) followed by the permission,
    + * attribute and extended-attribute operations.
    + */
    +struct inode_operations gfs2_dir_iops = {
    + /* namespace operations */
    + .lookup      = gfs2_lookup,
    + .create      = gfs2_create,
    + .mknod       = gfs2_mknod,
    + .mkdir       = gfs2_mkdir,
    + .rmdir       = gfs2_rmdir,
    + .link        = gfs2_link,
    + .unlink      = gfs2_unlink,
    + .symlink     = gfs2_symlink,
    + .rename      = gfs2_rename,
    + /* permission, attributes and extended attributes */
    + .getattr     = gfs2_getattr,
    + .setattr     = gfs2_setattr,
    + .permission  = gfs2_permission,
    + .getxattr    = gfs2_getxattr,
    + .setxattr    = gfs2_setxattr,
    + .listxattr   = gfs2_listxattr,
    + .removexattr = gfs2_removexattr,
    +};
    +
    +/*
    + * gfs2_symlink_iops - readlink and follow_link, plus the permission,
    + * attribute and extended-attribute operations.
    + */
    +struct inode_operations gfs2_symlink_iops = {
    + /* link resolution */
    + .follow_link = gfs2_follow_link,
    + .readlink    = gfs2_readlink,
    + /* permission, attributes and extended attributes */
    + .getattr     = gfs2_getattr,
    + .setattr     = gfs2_setattr,
    + .permission  = gfs2_permission,
    + .getxattr    = gfs2_getxattr,
    + .setxattr    = gfs2_setxattr,
    + .listxattr   = gfs2_listxattr,
    + .removexattr = gfs2_removexattr,
    +};
    +
    --- a/fs/gfs2/ops_inode.h 1969-12-31 17:00:00.000000000 -0700
    +++ b/fs/gfs2/ops_inode.h 2005-10-10 11:28:49.307785232 -0500
    @@ -0,0 +1,18 @@
    +/*
    + * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
    + * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
    + *
    + * This copyrighted material is made available to anyone wishing to use,
    + * modify, copy, or redistribute it subject to the terms and conditions
    + * of the GNU General Public License v.2.
    + */
    +
    +#ifndef __OPS_INODE_DOT_H__
    +#define __OPS_INODE_DOT_H__
    +
    +/* Inode operation tables; declared here, defined elsewhere. */
    +extern struct inode_operations gfs2_file_iops;
    +extern struct inode_operations gfs2_dev_iops;
    +extern struct inode_operations gfs2_dir_iops;
    +extern struct inode_operations gfs2_symlink_iops;
    +
    +#endif /* __OPS_INODE_DOT_H__ */
    -
    To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
    the body of a message to majordomo@vger.kernel.org
    More majordomo info at http://vger.kernel.org/majordomo-info.html
    Please read the FAQ at http://www.tux.org/lkml/


  • Next message: Greg KH: "Re: [PATCH 11/16] GFS: mount and tuning options"

    Relevant Pages

    • [PATCH 02c/13] GFS: core fs
      ... * modify, copy, or redistribute it subject to the terms and conditions ... * Check to make sure the lookup necessary to arrive at this inode from its ... +static struct dentry *gfs2_get_parent ... +extern struct export_operations gfs2_export_ops; ...
      (Linux-Kernel)
    • [PATCH 4/4] v9fs: implement 9p client interface that can be used outside vfs
      ... struct v9fs_session_info *v9ses) ... * @inode: ... static int __init init_v9fs ...
      (Linux-Kernel)
    • GFS2 Filesystem [5/16]
      ... superblock operations and inode operations ... * @offset: the offset ... The number of bytes read, errno on failure ... * @dentry: the dentry that points to the inode to sync ...
      (Linux-Kernel)
    • [PATCH 05/16] GFS2: File and inode operations
      ... superblock operations and inode operations ... filesystem flags. ... The number of bytes read, errno on failure ... * @dentry: the dentry that points to the inode to sync ...
      (Linux-Kernel)
    • [PATCH 9/9] clockpro-clockpro-stats.patch
      ... - use debugfs? ... files changed, 75 insertions(+) ... extern struct seq_operations zoneinfo_op; ... static int zoneinfo_open(struct inode *inode, ...
      (Linux-Kernel)