File: [Development] / xfs-linux-nodel / linux-2.6 / xfs_buf.h (download)
Revision 1.4, Tue Feb 26 13:53:10 2002 UTC (15 years, 8 months ago) by sandeen
Branch: MAIN
Changes since 1.3: +2 -1
lines
Merge of 2.4.x-xfs:slinx:112227a by lord.
Add pb_bmap_t to pagebuf_iozero arguments
|
/*
* Copyright (c) 2000 Silicon Graphics, Inc. All Rights Reserved.
*
* This program is free software; you can redistribute it and/or modify it
* under the terms of version 2 of the GNU General Public License as
* published by the Free Software Foundation.
*
* This program is distributed in the hope that it would be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
*
* Further, this software is distributed without any warranty that it is
* free of the rightful claim of any third person regarding infringement
* or the like. Any license provided herein, whether implied or
* otherwise, applies only to this software file. Patent licenses, if
* any, provided herein do not apply to combinations of this program with
* other software, or any other product whatsoever.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write the Free Software Foundation, Inc., 59
* Temple Place - Suite 330, Boston MA 02111-1307, USA.
*
* Contact information: Silicon Graphics, Inc., 1600 Amphitheatre Pkwy,
* Mountain View, CA 94043, or:
*
* http://www.sgi.com
*
* For further information regarding this notice, see:
*
* http://oss.sgi.com/projects/GenInfo/SGIGPLNoticeExplan/
*/
/*
* Written by Steve Lord, Jim Mostek, Russell Cattelan at SGI
*/
#ifndef __PAGE_BUF_H__
#define __PAGE_BUF_H__
#include <linux/version.h>
#include <linux/config.h>
#include <linux/list.h>
#include <linux/types.h>
#include <linux/spinlock.h>
#include <asm/system.h>
#include <linux/mm.h>
#include <linux/fs.h>
#include <linux/iobuf.h>
#include <linux/smp_lock.h>
#include <linux/uio.h>
/*
* Turn this on to get pagebuf lock ownership
#define PAGEBUF_LOCK_TRACKING
*/
/*
* Base types
*/
/* daddr must be signed since -1 is used for bmaps that are not yet allocated */
typedef loff_t page_buf_daddr_t;
#define PAGE_BUF_DADDR_NULL ((page_buf_daddr_t) (-1LL))
typedef size_t page_buf_dsize_t; /* size of buffer in blocks */
#define page_buf_ctob(pp) ((pp) * PAGE_CACHE_SIZE)
#define page_buf_btoc(dd) (((dd) + PAGE_CACHE_SIZE - 1) >> PAGE_CACHE_SHIFT)
#define page_buf_btoct(dd) ((dd) >> PAGE_CACHE_SHIFT)
#define page_buf_poff(aa) ((aa) & ~PAGE_CACHE_MASK)
typedef enum page_buf_rw_e {
PBRW_READ = 1, /* transfer into target memory */
PBRW_WRITE = 2, /* transfer from target memory */
PBRW_ZERO = 3 /* Zero target memory */
} page_buf_rw_t;
/*
* page_buf_bmap_t: File system I/O map
*
* The pbm_bn, pbm_offset and pbm_length fields are expressed in disk blocks.
* The pbm_length field specifies the size of the underlying backing store
* for the particular mapping.
*
* The pbm_bsize, pbm_size and pbm_delta fields are expressed in bytes and indicate
* the size of the mapping, the number of bytes that are valid to access
* (read or write), and the offset into the mapping, given the offset
* supplied to the file I/O map routine. pbm_delta is the offset of the
* desired data from the beginning of the mapping.
*
* When a request is made to read beyond the logical end of the object,
* pbm_size may be set to 0, but pbm_offset and pbm_length should be set to reflect
* the actual amount of underlying storage that has been allocated, if any.
*/
/* pbm_flags values */
typedef enum {
PBMF_EOF = 0x01, /* mapping contains EOF */
PBMF_HOLE = 0x02, /* mapping covers a hole */
PBMF_DELAY = 0x04, /* mapping covers delalloc region */
PBMF_UNWRITTEN = 0x20, /* mapping covers allocated */
/* but uninitialized XFS data */
} bmap_flags_t;
typedef struct page_buf_bmap_s {
page_buf_daddr_t pbm_bn; /* block number in file system */
kdev_t pbm_dev; /* device for I/O */
loff_t pbm_offset; /* byte offset of mapping in file */
size_t pbm_delta; /* offset of request into bmap */
size_t pbm_bsize; /* size of this mapping in bytes */
bmap_flags_t pbm_flags; /* options flags for mapping */
} page_buf_bmap_t;
typedef page_buf_bmap_t pb_bmap_t;
/*
* page_buf_t: Buffer structure for page cache-based buffers
*
* This buffer structure is used by the page cache buffer management routines
* to refer to an assembly of pages forming a logical buffer. The actual
* I/O is performed with kiobuf or buffer_head structures, as required by
* drivers, for drivers which do not understand this structure.
* The buffer structure is used on temporary basis only, and
* discarded when released.
*
* The real data storage is recorded in the page cache. Metadata is
* hashed to the inode for the block device on which the file system resides.
* File data is hashed to the inode for the file. Pages which are only
* partially filled with data have bits set in their block_map entry
* to indicate which disk blocks in the page are not valid.
*/
typedef enum page_buf_flags_e {
PBF_READ = (1 << 0), /* buffer intended for reading from device */
PBF_WRITE = (1 << 1), /* buffer intended for writing to device */
PBF_MAPPED = (1 << 2), /* buffer mapped (pb_addr valid) */
PBF_PARTIAL = (1 << 3), /* buffer partially read */
PBF_ASYNC = (1 << 4), /* initiator will not wait for completion */
PBF_NONE = (1 << 5), /* buffer not read at all */
PBF_DELWRI = (1 << 6), /* buffer has dirty pages */
PBF_FREED = (1 << 7), /* buffer has been freed and is invalid */
PBF_SYNC = (1 << 8), /* force updates to disk */
PBF_MAPPABLE = (1 << 9),/* use directly-addressable pages */
PBF_STALE = (1 << 10), /* buffer has been staled, do not find it */
PBF_FS_RESERVED_2 = (1 << 11), /* reserved for client use (UNUSED) */
PBF_RELEASE = (1 << 12),/* buffer to be released after I/O is done */
/* flags used only as arguments to access routines */
PBF_LOCK = (1 << 13), /* lock requested */
PBF_TRYLOCK = (1 << 14), /* lock requested, but do not wait */
PBF_ALLOCATE = (1 << 15), /* allocate all pages (UNUSED) */
PBF_FILE_ALLOCATE = (1 << 16), /* allocate all file space */
PBF_DONT_BLOCK = (1 << 17), /* do not block in current thread */
PBF_DIRECT = (1 << 18), /* direct I/O desired */
PBF_ENTER_PAGES = (1 << 21), /* create invalid pages for all */
/* pages in the range of the buffer */
/* not already associated with buffer */
/* flags used only internally */
_PBF_LOCKABLE = (1 << 19), /* page_buf_t may be locked */
_PBF_NEXT_KEY = (1 << 20), /* page_buf_t is a dummy used as a key */
_PBF_ALL_PAGES_MAPPED = (1 << 22),
/* all pages in rage are mapped */
_PBF_SOME_INVALID_PAGES = (1 << 23),
/* some mapped pages are not valid */
_PBF_ADDR_ALLOCATED = (1 << 24),
/* pb_addr space was allocated */
_PBF_MEM_ALLOCATED = (1 << 25),
/* pb_mem and underlying pages allocated */
PBF_GRIO = (1 << 26),
PBF_FORCEIO = (1 << 27),
PBF_FS_RESERVED_3 = (1 << 31) /* reserved (XFS use: XFS_B_STALE) */
} page_buf_flags_t;
#define PBF_UPDATE (PBF_READ | PBF_WRITE)
#define PBF_NOT_DONE(pb) (((pb)->pb_flags & (PBF_PARTIAL|PBF_NONE)) != 0)
#define PBF_DONE(pb) (((pb)->pb_flags & (PBF_PARTIAL|PBF_NONE)) == 0)
#if LINUX_VERSION_CODE < KERNEL_VERSION(2,4,13)
typedef struct pb_target {
kdev_t pbr_device;
unsigned short pbr_sector;
unsigned short pbr_blocksize;
unsigned int pbr_blocksize_bits;
struct address_space *pbr_addrspace;
avl_handle_t pbr_buffers;
spinlock_t pbr_lock;
} pb_target_t;
#define PB_ADDR_SPACE(pb) (&(pb)->pb_target->pbr_addrspace)
#else
typedef struct pb_target {
kdev_t pbr_device;
unsigned short pbr_sector;
unsigned short pbr_blocksize;
unsigned int pbr_blocksize_bits;
struct inode *pbr_inode;
avl_handle_t pbr_buffers;
spinlock_t pbr_lock;
} pb_target_t;
#define PB_ADDR_SPACE(pb) ((pb)->pb_target->pbr_inode->i_mapping)
#endif
struct page_buf_s;
typedef void (*page_buf_iodone_t)(struct page_buf_s *);
/* call-back function on I/O completion */
typedef void (*page_buf_relse_t)(struct page_buf_s *);
/* call-back function on I/O completion */
typedef int (*page_buf_bdstrat_t)(struct page_buf_s *);
typedef int (pagebuf_bmap_fn_t) (struct inode *, loff_t, ssize_t,
page_buf_bmap_t *, int, int *, int);
#define PB_PAGES 4
typedef struct page_buf_s {
struct list_head pb_list;
page_buf_flags_t pb_flags; /* status flags */
struct pb_target *pb_target; /* logical object */
unsigned int pb_hold; /* reference count */
page_buf_daddr_t pb_bn; /* block number for I/O */
kdev_t pb_dev;
loff_t pb_file_offset; /* offset in file */
size_t pb_buffer_length; /* size of buffer in bytes */
size_t pb_count_desired; /* desired transfer size */
void *pb_addr; /* virtual address of buffer */
page_buf_iodone_t pb_iodone; /* I/O completion function */
page_buf_relse_t pb_relse; /* releasing function */
page_buf_bdstrat_t pb_strat; /* pre-write function */
int pb_error; /* error code on I/O */
void *pb_fspriv;
void *pb_fspriv2;
void *pb_fspriv3;
int pb_page_count; /* size of page array */
int pb_locked; /* page array is locked */
unsigned int pb_offset; /* page offset in first page */
struct page **pb_pages; /* array of page pointers */
struct page *pb_page_array[PB_PAGES]; /* inline pages */
} page_buf_t;
typedef struct page_buf_private_s {
page_buf_t pb_common; /* public part of structure */
spinlock_t pb_lock;
struct semaphore pb_sema; /* semaphore for lockables */
unsigned long pb_flushtime; /* time to flush pagebuf */
atomic_t pb_io_remaining;/* #outstanding I/O requests */
struct semaphore pb_iodonesema; /* Semaphore for I/O waiters */
atomic_t pb_pin_count; /* pin count */
wait_queue_head_t pb_waiters; /* unpin waiters */
#ifdef PAGEBUF_LOCK_TRACKING
int pb_last_holder;
#endif /* PAGEBUF_LOCK_TRACKING */
} page_buf_private_t;
#define PBC(pb) (&((pb)->pb_common))
#define PBP(pb) ((page_buf_private_t *) (pb))
#define PB_SECTOR_SIZE(pb) ((pb)->pb_sector)
#ifdef PAGEBUF_LOCK_TRACKING
#define PB_SET_OWNER(pb) (PBP(pb)->pb_last_holder = current->pid)
#define PB_CLEAR_OWNER(pb) (PBP(pb)->pb_last_holder = -1)
#define PB_GET_OWNER(pb) (PBP(pb)->pb_last_holder)
#else
#define PB_SET_OWNER(pb)
#define PB_CLEAR_OWNER(pb)
#define PB_GET_OWNER(pb)
#endif
/* Tracing utilities for pagebuf */
typedef struct {
int event;
unsigned long pb;
page_buf_flags_t flags;
unsigned short hold;
unsigned short lock_value;
void *task;
void *misc;
void *ra;
loff_t offset;
size_t size;
} pagebuf_trace_t;
struct pagebuf_trace_buf {
pagebuf_trace_t *buf;
volatile int start;
volatile int end;
};
#define PB_TRACE_BUFSIZE 1024
#define CIRC_INC(i) (((i) + 1) & (PB_TRACE_BUFSIZE - 1))
typedef struct pagebuf_daemon {
int active;
spinlock_t pb_delwrite_lock;
struct list_head pb_delwrite_l;
int pb_delwri_cnt;
} pagebuf_daemon_t;
typedef struct pagebuf_marker_s {
struct list_head pb_list;
page_buf_flags_t pb_flags;
} pagebuf_marker_t;
/*
* Tunable pagebuf parameters
*/
#define P_PARAM 4
typedef union pagebuf_param {
struct {
ulong flush_interval; /* interval between runs of the
* delwri flush daemon. */
ulong age_buffer; /* time for buffer to age before
* we flush it. */
ulong max_dio; /* maximum pages locked in a dio call */
ulong debug; /* debug tracing on or off */
} p_un;
ulong data[P_PARAM];
} pagebuf_param_t;
enum {
PB_FLUSH_INT = 1,
PB_FLUSH_AGE = 2,
PB_DIO_MAX = 3,
PB_DEBUG = 4
};
extern pagebuf_param_t pb_params;
/*
* Pagebuf statistics
*/
struct pbstats {
u_int32_t pb_get;
u_int32_t pb_create;
u_int32_t pb_get_locked;
u_int32_t pb_get_locked_waited;
u_int32_t pb_busy_locked;
u_int32_t pb_miss_locked;
u_int32_t pb_page_alloc;
u_int32_t pb_page_found;
};
extern struct pbstats pbstats;
#define PB_STATS_INC(count) ( count ++ )
/*
* Page_buf_apply_t
*
* Type of function pointer supplied to pagebuf_segment_apply.
*/
typedef int (*page_buf_apply_t)( /* function to apply to segment */
page_buf_t *, /* buffer to examine */
loff_t, /* offset in file of segment */
struct page *, /* page (NULL if not in mem_map[]) */
size_t, /* offset in page */
size_t); /* length of segment */
/*
* page_buf module entry points
*/
/* Finding and Reading Buffers */
extern page_buf_t *pagebuf_find( /* find buffer for block if */
/* the block is in memory */
struct pb_target *, /* inode for block */
loff_t, /* starting offset of range */
size_t, /* length of range */
page_buf_flags_t); /* PBF_LOCK, PBF_ALWAYS_ALLOC */
extern page_buf_t *pagebuf_get( /* allocate a buffer */
struct pb_target *, /* inode for buffer */
loff_t, /* starting offset of range */
size_t, /* length of range */
page_buf_flags_t); /* PBF_LOCK, PBF_READ, PBF_ALLOCATE, */
/* PBF_ASYNC, PBF_SEQUENTIAL */
extern page_buf_t *pagebuf_lookup(
struct inode *,
loff_t, /* starting offset of range */
size_t, /* length of range */
int); /* PBF_ENTER_PAGES */
extern page_buf_t *pagebuf_get_empty( /* allocate pagebuf struct with */
/* no memory or disk address */
struct pb_target *); /* mount point "fake" inode */
extern page_buf_t *pagebuf_get_no_daddr(/* allocate pagebuf struct */
/* without disk address */
size_t len,
struct pb_target *); /* mount point "fake" inode */
extern int pagebuf_associate_memory(
page_buf_t *,
void *,
size_t);
extern void pagebuf_hold( /* increment reference count */
page_buf_t *); /* buffer to hold */
extern void pagebuf_readahead( /* read ahead into cache */
struct pb_target *, /* target for buffer (or NULL) */
loff_t, /* starting offset of range */
size_t, /* length of range */
int); /* additional read flags */
/* Writing and Releasing Buffers */
extern void pagebuf_free( /* deallocate a buffer */
page_buf_t *); /* buffer to deallocate */
extern void pagebuf_rele( /* release hold on a buffer */
page_buf_t *); /* buffer to release */
/* Locking and Unlocking Buffers */
extern int pagebuf_cond_lock( /* lock buffer, if not locked */
/* (returns -EBUSY if locked) */
page_buf_t *); /* buffer to lock */
extern int pagebuf_is_locked( /* test if buffer is locked */
/* (0 if unlocked, 1 if locked) */
page_buf_t *); /* buffer to test */
extern int pagebuf_lock_value( /* return count on lock */
page_buf_t *); /* buffer to check */
extern int pagebuf_lock( /* lock buffer */
page_buf_t *); /* buffer to lock */
extern int pagebuf_lock_disable( /* disable buffer locking */
struct pb_target *); /* inode for buffers */
extern struct pb_target *pagebuf_lock_enable(
kdev_t,
struct super_block *);
extern void pagebuf_target_blocksize(
pb_target_t *,
unsigned int); /* block size */
extern int pagebuf_target_clear(struct pb_target *);
extern void pagebuf_unlock( /* unlock buffer */
page_buf_t *); /* buffer to unlock */
/* Buffer Management for Inodes */
extern void pagebuf_flush( /* write buffered storage */
struct inode *, /* inode for range */
loff_t, /* first location in range */
page_buf_flags_t); /* PBF_ASYNC */
extern void pagebuf_inval( /* invalidate buffered data for */
/* inode */
struct inode *, /* inode for range */
loff_t, /* first location in range */
page_buf_flags_t); /* PBF_ASYNC */
extern void pagebuf_flushinval( /* write and invalidate */
/* buffered data for inode */
struct inode *, /* inode for range */
loff_t, /* first location in range */
page_buf_flags_t); /* PBF_ASYNC */
/* Buffer Utility Routines */
extern int pagebuf_geterror( /* return buffer error */
page_buf_t *); /* buffer */
extern void pagebuf_iodone( /* mark buffer I/O complete */
page_buf_t *); /* buffer to mark */
extern void pagebuf_ioerror( /* mark buffer in error (or not) */
page_buf_t *, /* buffer to mark */
int); /* error to store (0 if none) */
extern int pagebuf_iostart( /* start I/O on a buffer */
page_buf_t *, /* buffer to start */
page_buf_flags_t); /* PBF_LOCK, PBF_ASYNC, PBF_READ, */
/* PBF_WRITE, PBF_ALLOCATE, */
/* PBF_DELWRI, PBF_SEQUENTIAL, */
/* PBF_SYNC */
extern int pagebuf_iorequest( /* start real I/O */
page_buf_t *); /* buffer to convey to device */
/*
* pagebuf_iorequest is the core I/O request routine.
* It assumes that the buffer is well-formed and
* mapped and ready for physical I/O, unlike
* pagebuf_iostart() and pagebuf_iophysio(). Those
* routines call the inode pagebuf_ioinitiate routine to start I/O,
* if it is present, or else call pagebuf_iorequest()
* directly if the inode pagebuf_ioinitiate routine is not present.
*/
extern int pagebuf_iowait( /* wait for buffer I/O done */
page_buf_t *); /* buffer to wait on */
extern int pagebuf_iozero( /* zero contents of buffer */
struct inode *, /* inode owning pages */
page_buf_t *, /* buffer to zero */
off_t, /* offset in buffer */
size_t, /* size of data to zero */
loff_t, /* last permissible isize value */
pb_bmap_t *); /* pointer to pagebuf bmap */
extern caddr_t pagebuf_offset(page_buf_t *, off_t);
extern int pagebuf_segment( /* return next segment of buffer */
page_buf_t *, /* buffer to examine */
loff_t *, /* offset in buffer of next */
/* segment (updated) */
struct page **, /* page (updated) */
/* (NULL if not in mem_map[]) */
size_t *, /* offset in page (updated) */
size_t *, /* length of segment (updated) */
page_buf_flags_t); /* PBF_ALWAYS_ALLOC */
extern int pagebuf_iomove( /* move data in/out of pagebuf */
page_buf_t *, /* buffer to manipulate */
off_t, /* starting buffer offset */
size_t, /* length in buffer */
caddr_t, /* data pointer */
page_buf_rw_t); /* direction */
extern int pagebuf_segment_apply( /* apply function to segments */
page_buf_apply_t, /* function to call */
page_buf_t *); /* buffer to examine */
/* Pinning Buffer Storage in Memory */
extern void pagebuf_pin( /* pin buffer in memory */
page_buf_t *); /* buffer to pin */
extern void pagebuf_unpin( /* unpin buffered data */
page_buf_t *); /* buffer to unpin */
extern void pagebuf_wait_unpin( /* wait for buffer to be unpinned */
page_buf_t *); /* buffer for which to wait */
extern int pagebuf_ispin( page_buf_t *); /* check if pagebuf is pinned */
/* Reading and writing pages */
extern ssize_t pagebuf_direct_file_read(
struct file *, /* file to read */
char *, /* buffer address */
size_t, /* size of buffer */
loff_t *, /* file offset to use and update */
pagebuf_bmap_fn_t); /* bmap function */
/*
* pagebuf_direct_file_read reads data from the specified file
* at the loff_t referenced, updating the loff_t to point after the
* data read and returning the count of bytes read.
* The data is read into the supplied buffer, up to a maximum of the
* specified size.
*/
extern ssize_t pagebuf_generic_file_write(
struct file *, /* file to write */
char *, /* buffer address */
size_t, /* size of buffer */
loff_t *, /* file offset to use and update */
pagebuf_bmap_fn_t); /* bmap function */
/*
* pagebuf_generic_file_write writes data from the specified file
* at the loff_t referenced, updating the loff_t to point after the
* data written and returning the count of bytes written.
* The data is written from the supplied buffer, up to a maximum of the
* specified size. Normally all of the data is written, unless there
* is an error.
*/
extern int pagebuf_read_full_page( /* read a page via pagebuf */
struct file *, /* file to read */
struct page *, /* page to read */
pagebuf_bmap_fn_t); /* bmap function */
extern int pagebuf_write_full_page( /* write a page via pagebuf */
struct page *, /* page to write */
pagebuf_bmap_fn_t); /* bmap function */
extern int pagebuf_commit_write(
struct file *, /* file to write */
struct page *, /* page to write */
unsigned, /* from offset */
unsigned); /* to offset */
extern int pagebuf_prepare_write(
struct file *, /* file to write */
struct page *, /* page to write */
unsigned, /* from offset */
unsigned, /* to offset */
pagebuf_bmap_fn_t); /* bmap function */
extern void pagebuf_delwri_queue(page_buf_t *, int);
extern void pagebuf_delwri_dequeue(page_buf_t *);
#define PBDF_WAIT 0x01
#define PBDF_TRYLOCK 0x02
extern void pagebuf_delwri_flush(
struct pb_target *,
unsigned long,
int *);
extern int _pagebuf_get_object(
struct pb_target *,
loff_t,
size_t,
page_buf_flags_t,
page_buf_t **);
extern void _pagebuf_free_object( /* deallocate a buffer */
page_buf_t *, /* buffer to deallocate */
unsigned long); /* interrupt flags */
extern int _pagebuf_lookup_pages(
page_buf_t *,
struct address_space *,
page_buf_flags_t);
extern int pagebuf_locking_init(void);
extern void pagebuf_locking_terminate(void);
extern int pagebuf_init(void);
extern void pagebuf_terminate(void);
static __inline__ int __pagebuf_iorequest(page_buf_t *pb)
{
if (pb->pb_strat)
return pb->pb_strat(pb);
return pagebuf_iorequest(pb);
}
extern size_t pagebuf_max_direct(void);
#undef assert
#ifdef PAGEBUF_DEBUG
# define assert(expr) \
if (!(expr)) { \
printk("Assertion failed: %s\n%s::%s line %d\n",\
#expr,__FILE__,__FUNCTION__,__LINE__); \
BUG(); \
}
#else
# define assert(x) do { } while (0)
#endif
#ifndef STATIC
# define STATIC static
#endif
#endif /* __PAGE_BUF_H__ */