*
* Lustre Lite I/O Page Cache
*
- * Copyright (C) 2002 Cluster File Systems, Inc.
+ * Copyright (C) 2002 Cluster File Systems, Inc.
*/
#include <linux/config.h>
#include <linux/lustre_mds.h>
#include <linux/lustre_lite.h>
-
-#if (LINUX_VERSION_CODE < KERNEL_VERSION(2,4,10))
-/*
- * Add a page to the dirty page list.
- */
-void __set_page_dirty(struct page *page)
-{
- struct address_space *mapping;
- spinlock_t *pg_lock;
-
- pg_lock = PAGECACHE_LOCK(page);
- spin_lock(pg_lock);
-
- mapping = page->mapping;
- spin_lock(&mapping->page_lock);
-
- list_del(&page->list);
- list_add(&page->list, &mapping->dirty_pages);
-
- spin_unlock(&mapping->page_lock);
- spin_unlock(pg_lock);
-
- if (mapping->host)
- mark_inode_dirty_pages(mapping->host);
-}
-#else
-/*
- * Add a page to the dirty page list.
- */
-void set_page_dirty(struct page *page)
-{
- if (!test_and_set_bit(PG_dirty, &page->flags)) {
- struct address_space *mapping = page->mapping;
-
- if (mapping) {
- spin_lock(&pagecache_lock);
- list_del(&page->list);
- list_add(&page->list, &mapping->dirty_pages);
- spin_unlock(&pagecache_lock);
-
- if (mapping->host)
- mark_inode_dirty_pages(mapping->host);
- }
- }
-}
-#endif
-
-inline struct obdo * ll_oa_from_inode(struct inode *inode, unsigned long valid)
-{
- struct ll_inode_info *oinfo = ll_i2info(inode);
- struct obdo *oa = obdo_alloc();
- if ( !oa ) {
- CERROR("no memory to allocate obdo!\n");
- return NULL;
- }
- oa->o_valid = valid;
-
- if ( valid & OBD_MD_FLID )
- oa->o_id = oinfo->lli_objid;
- if ( valid & OBD_MD_FLATIME )
- oa->o_atime = inode->i_atime;
- if ( valid & OBD_MD_FLMTIME )
- oa->o_mtime = inode->i_mtime;
- if ( valid & OBD_MD_FLCTIME )
- oa->o_ctime = inode->i_ctime;
- if ( valid & OBD_MD_FLSIZE )
- oa->o_size = inode->i_size;
- if ( valid & OBD_MD_FLBLOCKS ) /* allocation of space */
- oa->o_blocks = inode->i_blocks;
- if ( valid & OBD_MD_FLBLKSZ )
- oa->o_blksize = inode->i_blksize;
- if ( valid & OBD_MD_FLMODE )
- oa->o_mode = inode->i_mode;
- if ( valid & OBD_MD_FLUID )
- oa->o_uid = inode->i_uid;
- if ( valid & OBD_MD_FLGID )
- oa->o_gid = inode->i_gid;
- if ( valid & OBD_MD_FLFLAGS )
- oa->o_flags = inode->i_flags;
- if ( valid & OBD_MD_FLNLINK )
- oa->o_nlink = inode->i_nlink;
- if ( valid & OBD_MD_FLGENER )
- oa->o_generation = inode->i_generation;
-
- CDEBUG(D_INFO, "src inode %ld, dst obdo %ld valid 0x%08lx\n",
- inode->i_ino, (long)oa->o_id, valid);
-#if 0
- /* this will transfer metadata for the logical object to
- the oa: that metadata could contain the constituent objects
- */
- if (ll_has_inline(inode)) {
- CDEBUG(D_INODE, "copying inline data from inode to obdo\n");
- memcpy(oa->o_inline, oinfo->lli_inline, OBD_INLINESZ);
- oa->o_obdflags |= OBD_FL_INLINEDATA;
- oa->o_valid |= OBD_MD_FLINLINE;
- }
-#endif
- return oa;
-} /* ll_oa_from_inode */
-
+#include <linux/lustre_lib.h>
-/*
- * Remove page from dirty list
- */
-void __set_page_clean(struct page *page)
-{
- struct address_space *mapping = page->mapping;
- struct inode *inode;
-
- if (!mapping)
- return;
-
- list_del(&page->list);
- list_add(&page->list, &mapping->clean_pages);
-
- inode = mapping->host;
- if (list_empty(&mapping->dirty_pages)) {
- CDEBUG(D_INODE, "inode clean\n");
- inode->i_state &= ~I_DIRTY_PAGES;
- }
- EXIT;
-}
-
/* SYNCHRONOUS I/O to object storage for an inode */
static int ll_brw(int rw, struct inode *inode, struct page *page, int create)
{
- obd_count num_obdo = 1;
- obd_count bufs_per_obdo = 1;
- struct obdo *oa;
- obd_size count = PAGE_SIZE;
- obd_off offset = ((obd_off)page->index) << PAGE_SHIFT;
- obd_flag flags = create ? OBD_BRW_CREATE : 0;
- int err;
+ struct ll_inode_info *lli = ll_i2info(inode);
+ struct lov_stripe_md *md = lli->lli_smd; /* stripe metadata read from the inode's ll_inode_info */
+ struct brw_page pg; /* describes the single page transferred by this call */
+ int err;
+ struct io_cb_data *cbd = ll_init_cb(); /* callback data handed to obd_brw() below; NULL means allocation failed */
ENTRY;
- oa = ll_oa_from_inode(inode, OBD_MD_FLNOTOBD);
- if (!oa)
+ if (!cbd)
RETURN(-ENOMEM);
- err = obd_brw(rw, ll_i2obdconn(inode), num_obdo, &oa, &bufs_per_obdo,
- &page, &count, &offset, &flags);
+ pg.pg = page;
+ pg.count = PAGE_SIZE; /* always a whole page */
+ pg.off = ((obd_off)page->index) << PAGE_SHIFT; /* byte offset of this page within the file */
+ pg.flag = create ? OBD_BRW_CREATE : 0; /* OBD_BRW_CREATE is requested only when create != 0 */
+
+ err = obd_brw(rw, ll_i2obdconn(inode), md, 1, &pg, ll_sync_io_cb, cbd); /* one brw_page; ll_sync_io_cb is passed as the callback with cbd as its data -- presumably it waits for completion, confirm */
- obdo_free(oa);
RETURN(err);
} /* ll_brw */
-extern void set_page_clean(struct page *);
-
-
-
/* returns the page unlocked, but with a reference */
static int ll_readpage(struct file *file, struct page *page)
{
struct inode *inode = page->mapping->host;
+ obd_off offset = ((obd_off)page->index) << PAGE_SHIFT;
int rc = 0;
ENTRY;
if (!PageLocked(page))
LBUG();
- if (((inode->i_size + PAGE_CACHE_SIZE -1)>>PAGE_SHIFT) <= page->index) {
- memset(kmap(page), 0, PAGE_CACHE_SIZE);
+ if (inode->i_size <= offset) {
+ memset(kmap(page), 0, PAGE_SIZE);
kunmap(page);
GOTO(readpage_out, rc);
}
obd_off offset = ((obd_off)page->index) << PAGE_SHIFT;
int rc = 0;
char *addr;
- ENTRY;
-
+ ENTRY;
+
addr = kmap(page);
if (!PageLocked(page))
LBUG();
if (Page_Uptodate(page))
GOTO(prepare_done, rc);
- if (offset + from >= inode->i_size) {
- memset(addr, 0, PAGE_SIZE);
- GOTO(prepare_done, rc);
- }
-
/* We're completely overwriting an existing page, so _don't_ set it up
* to date until commit_write */
- if (from == 0 && to == PAGE_SIZE) {
- memset(addr, 0, PAGE_SIZE);
+ if (from == 0 && to == PAGE_SIZE)
RETURN(0);
+
+ /* We are writing to a new page, no need to read old data */
+ if (inode->i_size <= offset) {
+ memset(addr, 0, PAGE_SIZE);
+ goto prepare_done;
}
rc = ll_brw(OBD_BRW_READ, inode, page, 0);
int err;
ENTRY;
- LBUG();
-
if (!PageLocked(page))
LBUG();
} else {
CERROR("ll_brw failure %d\n", err);
}
- UnlockPage(page);
+ unlock_page(page);
RETURN(err);
}
+
/* SYNCHRONOUS I/O to object storage for an inode -- object attr will be updated
* too */
static int ll_commit_write(struct file *file, struct page *page,
{
int create = 1;
struct inode *inode = page->mapping->host;
- obd_count num_obdo = 1;
- obd_count bufs_per_obdo = 1;
- struct obdo *oa;
- obd_size count = to;
- obd_off offset = (((obd_off)page->index) << PAGE_SHIFT);
- obd_flag flags = create ? OBD_BRW_CREATE : 0;
- int err;
- struct iattr iattr;
+ struct ll_inode_info *lli = ll_i2info(inode);
+ struct lov_stripe_md *md = lli->lli_smd; /* stripe metadata read from the inode's ll_inode_info */
+ struct brw_page pg; /* describes the single page written by this call */
+ int err;
+ loff_t size;
+ struct io_cb_data *cbd = ll_init_cb(); /* callback data handed to obd_brw() below; NULL means allocation failed */
+
+ pg.pg = page;
+ pg.count = to; /* NOTE(review): the count is "to", not "to - from", so the write covers the page from its first byte -- confirm intended */
+ pg.off = (((obd_off)page->index) << PAGE_SHIFT); /* byte offset of this page within the file */
+ pg.flag = create ? OBD_BRW_CREATE : 0; /* create is always 1 here, so OBD_BRW_CREATE is always set */
ENTRY;
- oa = ll_oa_from_inode(inode, OBD_MD_FLNOTOBD);
- if (! oa )
+ if (!cbd) /* NOTE(review): this early exit skips the kunmap(page) performed further down -- confirm the page is not left mapped */
RETURN(-ENOMEM);
SetPageUptodate(page);
if (!PageLocked(page))
LBUG();
- CDEBUG(D_INODE, "commit_page writing (at %d) to %d, count %Ld\n",
- from, to, (unsigned long long)count);
+ CDEBUG(D_INODE, "commit_page writing (at %d) to %d, count %Ld\n",
+ from, to, (unsigned long long)pg.count);
- err = obd_brw(OBD_BRW_WRITE, ll_i2obdconn(inode), num_obdo, &oa,
- &bufs_per_obdo, &page, &count, &offset, &flags);
+ err = obd_brw(OBD_BRW_WRITE, ll_i2obdconn(inode), md,
+ 1, &pg, ll_sync_io_cb, cbd);
kunmap(page);
- if (offset + to > inode->i_size) {
- iattr.ia_valid = ATTR_SIZE;
- iattr.ia_size = offset + to;
- /* do NOT truncate */
- inode->i_size = offset + to;
-#if 0
- err = ll_inode_setattr(inode, &iattr, 0);
- if (err) {
- CERROR("failed - %d.\n", err);
- err = -EIO;
- }
-#endif
- }
+ size = pg.off + pg.count; /* file offset just past the last byte covered by this write */
+ /* do NOT truncate when writing in the middle of a file */
+ if (size > inode->i_size) /* NOTE(review): i_size is extended even when err != 0 -- confirm intended */
+ inode->i_size = size;
- obdo_free(oa);
RETURN(err);
} /* ll_commit_write */
+/*
+ * Truncate the storage object backing @inode to inode->i_size.
+ *
+ * If the inode has no stripe metadata yet there is no object to punch, so
+ * only the inode's mtime/ctime are refreshed.  Otherwise the size lock is
+ * taken in LCK_PW mode, everything from i_size to the end of the object is
+ * punched, and the lock is dropped again.  Failures are logged with CERROR;
+ * nothing is returned to the caller.
+ */
void ll_truncate(struct inode *inode)
{
- struct obdo *oa;
+ struct obdo oa = {0};
+ struct lov_stripe_md *md = ll_i2info(inode)->lli_smd;
+ struct lustre_handle *lockhs = NULL;
int err;
ENTRY;
- oa = ll_oa_from_inode(inode, OBD_MD_FLNOTOBD);
- if ( !oa ) {
- CERROR("no memory to allocate obdo!\n");
- return;
- }
-
- CDEBUG(D_INFO, "calling punch for %ld (%Lu bytes at 0)\n",
- (long)oa->o_id, (unsigned long long)oa->o_size);
- err = obd_punch(ll_i2obdconn(inode), oa, oa->o_size, 0);
- obdo_free(oa);
+ if (!md) {
+ /* object not yet allocated */
+ inode->i_mtime = inode->i_ctime = CURRENT_TIME;
+ /* pair the ENTRY above, as the normal exit path does */
+ EXIT;
+ return;
+ }
+
+ oa.o_id = md->lmd_object_id;
+ oa.o_size = inode->i_size;
+
+ CDEBUG(D_INFO, "calling punch for %ld (all bytes after %Ld)\n",
+ (long)oa.o_id, (unsigned long long)oa.o_size);
+ err = ll_size_lock(inode, md, oa.o_size, LCK_PW, &lockhs);
if (err) {
- CERROR("obd_truncate fails (%d)\n", err);
+ CERROR("ll_size_lock failed: %d\n", err);
+ /* FIXME: What to do here? It's too late to back out... */
+ LBUG();
}
+
+ oa.o_valid = OBD_MD_FLID;
+ /* truncate == punch from the new size to the end of the object;
+ an all-ones end offset (-1) stands for "to the end".  The ULL
+ suffix keeps the constant 64 bits wide on every target. */
+ err = obd_punch(ll_i2obdconn(inode), &oa, md, inode->i_size,
+ 0xffffffffffffffffULL);
+ if (err)
+ CERROR("obd_truncate fails (%d)\n", err);
+ else
+ obdo_to_inode(inode, &oa, oa.o_valid);
+
+ /* the size lock is dropped whether or not the punch succeeded */
+ err = ll_size_unlock(inode, md, LCK_PW, lockhs);
+ if (err)
+ CERROR("ll_size_unlock failed: %d\n", err);
+
EXIT;
return;
} /* ll_truncate */
-int ll_direct_IO(int rw, struct inode * inode, struct kiobuf * iobuf, unsigned long blocknr, int blocksize)
+/*
+ * Synchronous direct I/O between the pages of @iobuf and the storage
+ * object of @inode.
+ *
+ * @rw:        WRITE selects OBD_BRW_WRITE, anything else OBD_BRW_READ
+ * @iobuf:     supplies nr_pages pages through maplist[]
+ * @blocknr:   page-sized block number of the first page; later pages use
+ *             consecutive block numbers
+ * @blocksize: must equal PAGE_SIZE
+ *
+ * Returns nr_pages * PAGE_SIZE when obd_brw() returns 0, the obd_brw()
+ * result otherwise, -EINVAL for an unsupported blocksize, and -ENOMEM when
+ * an allocation fails or the inode has no usable stripe metadata.
+ */
+int ll_direct_IO(int rw, struct inode *inode, struct kiobuf *iobuf,
+ unsigned long blocknr, int blocksize)
{
- int i;
- obd_count num_obdo = 1;
obd_count bufs_per_obdo = iobuf->nr_pages;
- struct obdo *oa = NULL;
+ struct ll_inode_info *lli = ll_i2info(inode);
+ struct lov_stripe_md *md = lli->lli_smd;
+ struct brw_page *pga;
+ struct io_cb_data *cbd;
+ int rc = 0;
+ int i;
+
+ ENTRY;
+
+ /* Validate before allocating anything, so these exits have nothing
+ * to release. */
+ if (blocksize != PAGE_SIZE) {
+ CERROR("direct_IO blocksize != PAGE_SIZE\n");
+ RETURN(-EINVAL);
+ }
+
+ /* NOTE(review): -ENOMEM is the errno this check has always returned,
+ * although no allocation has failed on this path. */
+ if (!md || !md->lmd_object_id)
+ RETURN(-ENOMEM);
+
+ OBD_ALLOC(pga, sizeof(*pga) * bufs_per_obdo);
+ if (!pga)
+ RETURN(-ENOMEM);
+
+ /* The callback data is handed to obd_brw() below and nothing in this
+ * function releases it, so allocate it last: no exit above can then
+ * leave it orphaned. */
+ cbd = ll_init_cb();
+ if (!cbd)
+ GOTO(out, rc = -ENOMEM);
+
+ /* NB: we can't use iobuf->maplist[i]->index for the offset
+ * instead of "blocknr" because ->index contains garbage.
+ */
+ for (i = 0; i < bufs_per_obdo; i++, blocknr++) {
+ pga[i].pg = iobuf->maplist[i];
+ pga[i].count = PAGE_SIZE;
+ pga[i].off = (obd_off)blocknr << PAGE_SHIFT;
+ pga[i].flag = OBD_BRW_CREATE;
+ }
+
+ rc = obd_brw(rw == WRITE ? OBD_BRW_WRITE : OBD_BRW_READ,
+ ll_i2obdconn(inode), md, bufs_per_obdo, pga,
+ ll_sync_io_cb, cbd);
+ if (rc == 0)
+ rc = bufs_per_obdo * PAGE_SIZE;
+
+out:
+ /* only reached once pga has been allocated */
+ OBD_FREE(pga, sizeof(*pga) * bufs_per_obdo);
+ RETURN(rc);
+}
+
+
+int ll_flush_inode_pages(struct inode * inode)
+{
+ obd_count bufs_per_obdo = 0; /* NOTE(review): never changed from 0 in the visible code, so every allocation below is sized 0 -- looks like a stub, confirm */
obd_size *count = NULL;
obd_off *offset = NULL;
obd_flag *flags = NULL;
ENTRY;
- OBD_ALLOC(count, sizeof(obd_size) * bufs_per_obdo);
- if (!count)
- GOTO(out, err=-ENOMEM);
+ spin_lock(&pagecache_lock); /* NOTE(review): the lock is released again with nothing in between -- placeholder for the page walk? */
+
+ spin_unlock(&pagecache_lock);
- OBD_ALLOC(offset, sizeof(obd_off) * bufs_per_obdo);
- if (!offset)
- GOTO(out, err=-ENOMEM);
- OBD_ALLOC(flags, sizeof(obd_flag) * bufs_per_obdo);
- if (!flags)
- GOTO(out, err=-ENOMEM);
+ OBD_ALLOC(count, sizeof(*count) * bufs_per_obdo);
+ OBD_ALLOC(offset, sizeof(*offset) * bufs_per_obdo);
+ OBD_ALLOC(flags, sizeof(*flags) * bufs_per_obdo);
+ if (!count || !offset || !flags) /* NOTE(review): on a partial failure "out" passes the NULL pointer(s) to OBD_FREE -- confirm OBD_FREE accepts NULL */
+ GOTO(out, err=-ENOMEM);
- for (i = 0 ; i < bufs_per_obdo ; i++) {
+#if 0 /* disabled: the body refers to i and iobuf, neither of which this function declares or receives */
+ for (i = 0 ; i < bufs_per_obdo ; i++) {
count[i] = PAGE_SIZE;
offset[i] = ((obd_off)(iobuf->maplist[i])->index) << PAGE_SHIFT;
flags[i] = OBD_BRW_CREATE;
}
- oa = ll_oa_from_inode(inode, OBD_MD_FLNOTOBD);
- if (!oa)
- RETURN(-ENOMEM);
-
- err = obd_brw(rw, ll_i2obdconn(inode), num_obdo, &oa, &bufs_per_obdo,
- iobuf->maplist, count, offset, flags);
+ err = obd_brw(OBD_BRW_WRITE, ll_i2obdconn(inode),
+ ll_i2info(inode)->lli_smd, bufs_per_obdo,
+ iobuf->maplist, count, offset, flags, NULL, NULL);
if (err == 0)
- err = bufs_per_obdo * PAGE_SIZE;
-
+ err = bufs_per_obdo * 4096; /* NOTE(review): literal 4096 where the code being replaced used PAGE_SIZE */
+#endif
out:
- if (oa)
- obdo_free(oa);
- if (flags)
- OBD_FREE(flags, sizeof(obd_flag) * bufs_per_obdo);
- if (count)
- OBD_FREE(count, sizeof(obd_count) * bufs_per_obdo);
- if (offset)
- OBD_FREE(offset, sizeof(obd_off) * bufs_per_obdo);
+ OBD_FREE(flags, sizeof(*flags) * bufs_per_obdo); /* sizes mirror the OBD_ALLOC calls above */
+ OBD_FREE(count, sizeof(*count) * bufs_per_obdo);
+ OBD_FREE(offset, sizeof(*offset) * bufs_per_obdo);
RETURN(err);
}
direct_IO: ll_direct_IO,
#endif
sync_page: block_sync_page,
- prepare_write: ll_prepare_write,
+ prepare_write: ll_prepare_write,
commit_write: ll_commit_write,
bmap: NULL
};