Commit 77605e41 authored by Jinshan Xiong's avatar Jinshan Xiong Committed by Greg Kroah-Hartman

staging/lustre/clio: add pages into writeback cache in batches

in ll_write_end(), instead of adding the page into writeback
cache directly, it will be held in a page list. After enough
pages have been collected, issue them all with cio_commit_async().
Signed-off-by: default avatarJinshan Xiong <jinshan.xiong@intel.com>
Reviewed-on: http://review.whamcloud.com/7893
Intel-bug-id: https://jira.hpdd.intel.com/browse/LU-3321Reviewed-by: default avatarBobi Jam <bobijam@gmail.com>
Reviewed-by: default avatarLai Siyao <lai.siyao@intel.com>
Signed-off-by: default avatarOleg Drokin <green@linuxhacker.ru>
Signed-off-by: default avatarGreg Kroah-Hartman <gregkh@linuxfoundation.org>
parent 3c361c1c
...@@ -1019,26 +1019,6 @@ struct cl_page_operations { ...@@ -1019,26 +1019,6 @@ struct cl_page_operations {
*/ */
int (*cpo_make_ready)(const struct lu_env *env, int (*cpo_make_ready)(const struct lu_env *env,
const struct cl_page_slice *slice); const struct cl_page_slice *slice);
/**
* Announce that this page is to be written out
* opportunistically, that is, page is dirty, it is not
* necessary to start write-out transfer right now, but
* eventually page has to be written out.
*
* Main caller of this is the write path (see
* vvp_io_commit_write()), using this method to build a
* "transfer cache" from which large transfers are then
* constructed by the req-formation engine.
*
* \todo XXX it would make sense to add page-age tracking
* semantics here, and to oblige the req-formation engine to
* send the page out not later than it is too old.
*
* \see cl_page_cache_add()
*/
int (*cpo_cache_add)(const struct lu_env *env,
const struct cl_page_slice *slice,
struct cl_io *io);
} io[CRT_NR]; } io[CRT_NR];
/** /**
* Tell transfer engine that only [to, from] part of a page should be * Tell transfer engine that only [to, from] part of a page should be
...@@ -2023,6 +2003,8 @@ struct cl_io_slice { ...@@ -2023,6 +2003,8 @@ struct cl_io_slice {
struct list_head cis_linkage; struct list_head cis_linkage;
}; };
typedef void (*cl_commit_cbt)(const struct lu_env *, struct cl_io *,
struct cl_page *);
/** /**
* Per-layer io operations. * Per-layer io operations.
* \see vvp_io_ops, lov_io_ops, lovsub_io_ops, osc_io_ops * \see vvp_io_ops, lov_io_ops, lovsub_io_ops, osc_io_ops
...@@ -2106,7 +2088,7 @@ struct cl_io_operations { ...@@ -2106,7 +2088,7 @@ struct cl_io_operations {
void (*cio_fini)(const struct lu_env *env, void (*cio_fini)(const struct lu_env *env,
const struct cl_io_slice *slice); const struct cl_io_slice *slice);
} op[CIT_OP_NR]; } op[CIT_OP_NR];
struct {
/** /**
* Submit pages from \a queue->c2_qin for IO, and move * Submit pages from \a queue->c2_qin for IO, and move
* successfully submitted pages into \a queue->c2_qout. Return * successfully submitted pages into \a queue->c2_qout. Return
...@@ -2119,7 +2101,15 @@ struct cl_io_operations { ...@@ -2119,7 +2101,15 @@ struct cl_io_operations {
const struct cl_io_slice *slice, const struct cl_io_slice *slice,
enum cl_req_type crt, enum cl_req_type crt,
struct cl_2queue *queue); struct cl_2queue *queue);
} req_op[CRT_NR]; /**
* Queue async page for write.
* The difference between cio_submit and cio_queue is that
* cio_submit is for urgent request.
*/
int (*cio_commit_async)(const struct lu_env *env,
const struct cl_io_slice *slice,
struct cl_page_list *queue, int from, int to,
cl_commit_cbt cb);
/** /**
* Read missing page. * Read missing page.
* *
...@@ -2131,31 +2121,6 @@ struct cl_io_operations { ...@@ -2131,31 +2121,6 @@ struct cl_io_operations {
int (*cio_read_page)(const struct lu_env *env, int (*cio_read_page)(const struct lu_env *env,
const struct cl_io_slice *slice, const struct cl_io_slice *slice,
const struct cl_page_slice *page); const struct cl_page_slice *page);
/**
* Prepare write of a \a page. Called bottom-to-top by a top-level
* cl_io_operations::op[CIT_WRITE]::cio_start() to prepare page for
* get data from user-level buffer.
*
* \pre io->ci_type == CIT_WRITE
*
* \see vvp_io_prepare_write(), lov_io_prepare_write(),
* osc_io_prepare_write().
*/
int (*cio_prepare_write)(const struct lu_env *env,
const struct cl_io_slice *slice,
const struct cl_page_slice *page,
unsigned from, unsigned to);
/**
*
* \pre io->ci_type == CIT_WRITE
*
* \see vvp_io_commit_write(), lov_io_commit_write(),
* osc_io_commit_write().
*/
int (*cio_commit_write)(const struct lu_env *env,
const struct cl_io_slice *slice,
const struct cl_page_slice *page,
unsigned from, unsigned to);
/** /**
* Optional debugging helper. Print given io slice. * Optional debugging helper. Print given io slice.
*/ */
...@@ -3044,15 +3009,14 @@ int cl_io_lock_alloc_add(const struct lu_env *env, struct cl_io *io, ...@@ -3044,15 +3009,14 @@ int cl_io_lock_alloc_add(const struct lu_env *env, struct cl_io *io,
struct cl_lock_descr *descr); struct cl_lock_descr *descr);
int cl_io_read_page(const struct lu_env *env, struct cl_io *io, int cl_io_read_page(const struct lu_env *env, struct cl_io *io,
struct cl_page *page); struct cl_page *page);
int cl_io_prepare_write(const struct lu_env *env, struct cl_io *io,
struct cl_page *page, unsigned from, unsigned to);
int cl_io_commit_write(const struct lu_env *env, struct cl_io *io,
struct cl_page *page, unsigned from, unsigned to);
int cl_io_submit_rw(const struct lu_env *env, struct cl_io *io, int cl_io_submit_rw(const struct lu_env *env, struct cl_io *io,
enum cl_req_type iot, struct cl_2queue *queue); enum cl_req_type iot, struct cl_2queue *queue);
int cl_io_submit_sync(const struct lu_env *env, struct cl_io *io, int cl_io_submit_sync(const struct lu_env *env, struct cl_io *io,
enum cl_req_type iot, struct cl_2queue *queue, enum cl_req_type iot, struct cl_2queue *queue,
long timeout); long timeout);
int cl_io_commit_async(const struct lu_env *env, struct cl_io *io,
struct cl_page_list *queue, int from, int to,
cl_commit_cbt cb);
int cl_io_is_going(const struct lu_env *env); int cl_io_is_going(const struct lu_env *env);
/** /**
...@@ -3108,6 +3072,12 @@ static inline struct cl_page *cl_page_list_last(struct cl_page_list *plist) ...@@ -3108,6 +3072,12 @@ static inline struct cl_page *cl_page_list_last(struct cl_page_list *plist)
return list_entry(plist->pl_pages.prev, struct cl_page, cp_batch); return list_entry(plist->pl_pages.prev, struct cl_page, cp_batch);
} }
static inline struct cl_page *cl_page_list_first(struct cl_page_list *plist)
{
LASSERT(plist->pl_nr > 0);
return list_entry(plist->pl_pages.next, struct cl_page, cp_batch);
}
/** /**
* Iterate over pages in a page list. * Iterate over pages in a page list.
*/ */
...@@ -3124,9 +3094,14 @@ void cl_page_list_init(struct cl_page_list *plist); ...@@ -3124,9 +3094,14 @@ void cl_page_list_init(struct cl_page_list *plist);
void cl_page_list_add(struct cl_page_list *plist, struct cl_page *page); void cl_page_list_add(struct cl_page_list *plist, struct cl_page *page);
void cl_page_list_move(struct cl_page_list *dst, struct cl_page_list *src, void cl_page_list_move(struct cl_page_list *dst, struct cl_page_list *src,
struct cl_page *page); struct cl_page *page);
void cl_page_list_move_head(struct cl_page_list *dst, struct cl_page_list *src,
struct cl_page *page);
void cl_page_list_splice(struct cl_page_list *list, struct cl_page_list *head); void cl_page_list_splice(struct cl_page_list *list, struct cl_page_list *head);
void cl_page_list_del(const struct lu_env *env, struct cl_page_list *plist,
struct cl_page *page);
void cl_page_list_disown(const struct lu_env *env, void cl_page_list_disown(const struct lu_env *env,
struct cl_io *io, struct cl_page_list *plist); struct cl_io *io, struct cl_page_list *plist);
void cl_page_list_fini(const struct lu_env *env, struct cl_page_list *plist);
void cl_2queue_init(struct cl_2queue *queue); void cl_2queue_init(struct cl_2queue *queue);
void cl_2queue_disown(const struct lu_env *env, void cl_2queue_disown(const struct lu_env *env,
......
...@@ -91,6 +91,12 @@ struct ccc_io { ...@@ -91,6 +91,12 @@ struct ccc_io {
struct { struct {
enum ccc_setattr_lock_type cui_local_lock; enum ccc_setattr_lock_type cui_local_lock;
} setattr; } setattr;
struct {
struct cl_page_list cui_queue;
unsigned long cui_written;
int cui_from;
int cui_to;
} write;
} u; } u;
/** /**
* True iff io is processing glimpse right now. * True iff io is processing glimpse right now.
......
...@@ -1120,6 +1120,9 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args, ...@@ -1120,6 +1120,9 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args,
struct cl_io *io; struct cl_io *io;
ssize_t result; ssize_t result;
CDEBUG(D_VFSTRACE, "file: %s, type: %d ppos: %llu, count: %zd\n",
file->f_path.dentry->d_name.name, iot, *ppos, count);
restart: restart:
io = ccc_env_thread_io(env); io = ccc_env_thread_io(env);
ll_io_init(io, file, iot == CIT_WRITE); ll_io_init(io, file, iot == CIT_WRITE);
...@@ -1144,9 +1147,8 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args, ...@@ -1144,9 +1147,8 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args,
goto out; goto out;
} }
write_mutex_locked = 1; write_mutex_locked = 1;
} else if (iot == CIT_READ) {
down_read(&lli->lli_trunc_sem);
} }
down_read(&lli->lli_trunc_sem);
break; break;
case IO_SPLICE: case IO_SPLICE:
vio->u.splice.cui_pipe = args->u.splice.via_pipe; vio->u.splice.cui_pipe = args->u.splice.via_pipe;
...@@ -1157,10 +1159,10 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args, ...@@ -1157,10 +1159,10 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args,
LBUG(); LBUG();
} }
result = cl_io_loop(env, io); result = cl_io_loop(env, io);
if (args->via_io_subtype == IO_NORMAL)
up_read(&lli->lli_trunc_sem);
if (write_mutex_locked) if (write_mutex_locked)
mutex_unlock(&lli->lli_write_mutex); mutex_unlock(&lli->lli_write_mutex);
else if (args->via_io_subtype == IO_NORMAL && iot == CIT_READ)
up_read(&lli->lli_trunc_sem);
} else { } else {
/* cl_io_rw_init() handled IO */ /* cl_io_rw_init() handled IO */
result = io->ci_result; result = io->ci_result;
...@@ -1197,6 +1199,7 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args, ...@@ -1197,6 +1199,7 @@ ll_file_io_generic(const struct lu_env *env, struct vvp_io_args *args,
fd->fd_write_failed = true; fd->fd_write_failed = true;
} }
} }
CDEBUG(D_VFSTRACE, "iot: %d, result: %zd\n", iot, result);
return result; return result;
} }
......
...@@ -697,8 +697,6 @@ int ll_md_blocking_ast(struct ldlm_lock *, struct ldlm_lock_desc *, ...@@ -697,8 +697,6 @@ int ll_md_blocking_ast(struct ldlm_lock *, struct ldlm_lock_desc *,
struct dentry *ll_splice_alias(struct inode *inode, struct dentry *de); struct dentry *ll_splice_alias(struct inode *inode, struct dentry *de);
/* llite/rw.c */ /* llite/rw.c */
int ll_prepare_write(struct file *, struct page *, unsigned from, unsigned to);
int ll_commit_write(struct file *, struct page *, unsigned from, unsigned to);
int ll_writepage(struct page *page, struct writeback_control *wbc); int ll_writepage(struct page *page, struct writeback_control *wbc);
int ll_writepages(struct address_space *, struct writeback_control *wbc); int ll_writepages(struct address_space *, struct writeback_control *wbc);
int ll_readpage(struct file *file, struct page *page); int ll_readpage(struct file *file, struct page *page);
...@@ -706,6 +704,9 @@ void ll_readahead_init(struct inode *inode, struct ll_readahead_state *ras); ...@@ -706,6 +704,9 @@ void ll_readahead_init(struct inode *inode, struct ll_readahead_state *ras);
int ll_readahead(const struct lu_env *env, struct cl_io *io, int ll_readahead(const struct lu_env *env, struct cl_io *io,
struct ll_readahead_state *ras, struct address_space *mapping, struct ll_readahead_state *ras, struct address_space *mapping,
struct cl_page_list *queue, int flags); struct cl_page_list *queue, int flags);
int vvp_io_write_commit(const struct lu_env *env, struct cl_io *io);
struct ll_cl_context *ll_cl_init(struct file *file, struct page *vmpage);
void ll_cl_fini(struct ll_cl_context *lcc);
extern const struct address_space_operations ll_aops; extern const struct address_space_operations ll_aops;
...@@ -1476,4 +1477,7 @@ int ll_layout_restore(struct inode *inode); ...@@ -1476,4 +1477,7 @@ int ll_layout_restore(struct inode *inode);
int ll_xattr_init(void); int ll_xattr_init(void);
void ll_xattr_fini(void); void ll_xattr_fini(void);
int ll_page_sync_io(const struct lu_env *env, struct cl_io *io,
struct cl_page *page, enum cl_req_type crt);
#endif /* LLITE_INTERNAL_H */ #endif /* LLITE_INTERNAL_H */
...@@ -63,7 +63,7 @@ ...@@ -63,7 +63,7 @@
* Finalizes cl-data before exiting typical address_space operation. Dual to * Finalizes cl-data before exiting typical address_space operation. Dual to
* ll_cl_init(). * ll_cl_init().
*/ */
static void ll_cl_fini(struct ll_cl_context *lcc) void ll_cl_fini(struct ll_cl_context *lcc)
{ {
struct lu_env *env = lcc->lcc_env; struct lu_env *env = lcc->lcc_env;
struct cl_io *io = lcc->lcc_io; struct cl_io *io = lcc->lcc_io;
...@@ -84,8 +84,7 @@ static void ll_cl_fini(struct ll_cl_context *lcc) ...@@ -84,8 +84,7 @@ static void ll_cl_fini(struct ll_cl_context *lcc)
* Initializes common cl-data at the typical address_space operation entry * Initializes common cl-data at the typical address_space operation entry
* point. * point.
*/ */
static struct ll_cl_context *ll_cl_init(struct file *file, struct ll_cl_context *ll_cl_init(struct file *file, struct page *vmpage)
struct page *vmpage, int create)
{ {
struct ll_cl_context *lcc; struct ll_cl_context *lcc;
struct lu_env *env; struct lu_env *env;
...@@ -96,7 +95,7 @@ static struct ll_cl_context *ll_cl_init(struct file *file, ...@@ -96,7 +95,7 @@ static struct ll_cl_context *ll_cl_init(struct file *file,
int refcheck; int refcheck;
int result = 0; int result = 0;
clob = ll_i2info(vmpage->mapping->host)->lli_clob; clob = ll_i2info(file_inode(file))->lli_clob;
LASSERT(clob); LASSERT(clob);
env = cl_env_get(&refcheck); env = cl_env_get(&refcheck);
...@@ -111,62 +110,18 @@ static struct ll_cl_context *ll_cl_init(struct file *file, ...@@ -111,62 +110,18 @@ static struct ll_cl_context *ll_cl_init(struct file *file,
cio = ccc_env_io(env); cio = ccc_env_io(env);
io = cio->cui_cl.cis_io; io = cio->cui_cl.cis_io;
if (!io && create) { lcc->lcc_io = io;
struct inode *inode = vmpage->mapping->host; if (!io) {
loff_t pos; struct inode *inode = file_inode(file);
if (inode_trylock(inode)) { CERROR("%s: " DFID " no active IO, please file a ticket.\n",
inode_unlock((inode)); ll_get_fsname(inode->i_sb, NULL, 0),
PFID(ll_inode2fid(inode)));
dump_stack();
/* this is too bad. Someone is trying to write the
* page w/o holding inode mutex. This means we can
* add dirty pages into cache during truncate
*/
CERROR("Proc %s is dirtying page w/o inode lock, this will break truncate\n",
current->comm);
dump_stack();
LBUG();
return ERR_PTR(-EIO);
}
/*
* Loop-back driver calls ->prepare_write().
* methods directly, bypassing file system ->write() operation,
* so cl_io has to be created here.
*/
io = ccc_env_thread_io(env);
ll_io_init(io, file, 1);
/* No lock at all for this kind of IO - we can't do it because
* we have held page lock, it would cause deadlock.
* XXX: This causes poor performance to loop device - One page
* per RPC.
* In order to get better performance, users should use
* lloop driver instead.
*/
io->ci_lockreq = CILR_NEVER;
pos = vmpage->index << PAGE_CACHE_SHIFT;
/* Create a temp IO to serve write. */
result = cl_io_rw_init(env, io, CIT_WRITE, pos, PAGE_CACHE_SIZE);
if (result == 0) {
cio->cui_fd = LUSTRE_FPRIVATE(file);
cio->cui_iter = NULL;
result = cl_io_iter_init(env, io);
if (result == 0) {
result = cl_io_lock(env, io);
if (result == 0)
result = cl_io_start(env, io);
}
} else
result = io->ci_result;
}
lcc->lcc_io = io;
if (!io)
result = -EIO; result = -EIO;
if (result == 0) { }
if (result == 0 && vmpage) {
struct cl_page *page; struct cl_page *page;
LASSERT(io->ci_state == CIS_IO_GOING); LASSERT(io->ci_state == CIS_IO_GOING);
...@@ -185,99 +140,9 @@ static struct ll_cl_context *ll_cl_init(struct file *file, ...@@ -185,99 +140,9 @@ static struct ll_cl_context *ll_cl_init(struct file *file,
lcc = ERR_PTR(result); lcc = ERR_PTR(result);
} }
CDEBUG(D_VFSTRACE, "%lu@"DFID" -> %d %p %p\n",
vmpage->index, PFID(lu_object_fid(&clob->co_lu)), result,
env, io);
return lcc; return lcc;
} }
static struct ll_cl_context *ll_cl_get(void)
{
struct ll_cl_context *lcc;
struct lu_env *env;
int refcheck;
env = cl_env_get(&refcheck);
LASSERT(!IS_ERR(env));
lcc = &vvp_env_info(env)->vti_io_ctx;
LASSERT(env == lcc->lcc_env);
LASSERT(current == lcc->lcc_cookie);
cl_env_put(env, &refcheck);
/* env has got in ll_cl_init, so it is still usable. */
return lcc;
}
/**
* ->prepare_write() address space operation called by generic_file_write()
* for every page during write.
*/
int ll_prepare_write(struct file *file, struct page *vmpage, unsigned from,
unsigned to)
{
struct ll_cl_context *lcc;
int result;
lcc = ll_cl_init(file, vmpage, 1);
if (!IS_ERR(lcc)) {
struct lu_env *env = lcc->lcc_env;
struct cl_io *io = lcc->lcc_io;
struct cl_page *page = lcc->lcc_page;
cl_page_assume(env, io, page);
result = cl_io_prepare_write(env, io, page, from, to);
if (result == 0) {
/*
* Add a reference, so that page is not evicted from
* the cache until ->commit_write() is called.
*/
cl_page_get(page);
lu_ref_add(&page->cp_reference, "prepare_write",
current);
} else {
cl_page_unassume(env, io, page);
ll_cl_fini(lcc);
}
/* returning 0 in prepare assumes commit must be called
* afterwards
*/
} else {
result = PTR_ERR(lcc);
}
return result;
}
int ll_commit_write(struct file *file, struct page *vmpage, unsigned from,
unsigned to)
{
struct ll_cl_context *lcc;
struct lu_env *env;
struct cl_io *io;
struct cl_page *page;
int result = 0;
lcc = ll_cl_get();
env = lcc->lcc_env;
page = lcc->lcc_page;
io = lcc->lcc_io;
LASSERT(cl_page_is_owned(page, io));
LASSERT(from <= to);
if (from != to) /* handle short write case. */
result = cl_io_commit_write(env, io, page, from, to);
if (cl_page_is_owned(page, io))
cl_page_unassume(env, io, page);
/*
* Release reference acquired by ll_prepare_write().
*/
lu_ref_del(&page->cp_reference, "prepare_write", current);
cl_page_put(env, page);
ll_cl_fini(lcc);
return result;
}
static void ll_ra_stats_inc_sbi(struct ll_sb_info *sbi, enum ra_stat which); static void ll_ra_stats_inc_sbi(struct ll_sb_info *sbi, enum ra_stat which);
/** /**
...@@ -1251,7 +1116,7 @@ int ll_readpage(struct file *file, struct page *vmpage) ...@@ -1251,7 +1116,7 @@ int ll_readpage(struct file *file, struct page *vmpage)
struct ll_cl_context *lcc; struct ll_cl_context *lcc;
int result; int result;
lcc = ll_cl_init(file, vmpage, 0); lcc = ll_cl_init(file, vmpage);
if (!IS_ERR(lcc)) { if (!IS_ERR(lcc)) {
struct lu_env *env = lcc->lcc_env; struct lu_env *env = lcc->lcc_env;
struct cl_io *io = lcc->lcc_io; struct cl_io *io = lcc->lcc_io;
...@@ -1273,3 +1138,28 @@ int ll_readpage(struct file *file, struct page *vmpage) ...@@ -1273,3 +1138,28 @@ int ll_readpage(struct file *file, struct page *vmpage)
} }
return result; return result;
} }
int ll_page_sync_io(const struct lu_env *env, struct cl_io *io,
struct cl_page *page, enum cl_req_type crt)
{
struct cl_2queue *queue;
int result;
LASSERT(io->ci_type == CIT_READ || io->ci_type == CIT_WRITE);
queue = &io->ci_queue;
cl_2queue_init_page(queue, page);
result = cl_io_submit_sync(env, io, crt, queue, 0);
LASSERT(cl_page_is_owned(page, io));
if (crt == CRT_READ)
/*
* in CRT_WRITE case page is left locked even in case of
* error.
*/
cl_page_list_disown(env, io, &queue->c2_qin);
cl_2queue_fini(env, queue);
return result;
}
...@@ -462,57 +462,211 @@ static ssize_t ll_direct_IO_26(struct kiocb *iocb, struct iov_iter *iter, ...@@ -462,57 +462,211 @@ static ssize_t ll_direct_IO_26(struct kiocb *iocb, struct iov_iter *iter,
inode_unlock(inode); inode_unlock(inode);
if (tot_bytes > 0) { if (tot_bytes > 0) {
if (iov_iter_rw(iter) == WRITE) { struct ccc_io *cio = ccc_env_io(env);
struct lov_stripe_md *lsm;
/* no commit async for direct IO */
lsm = ccc_inode_lsm_get(inode); cio->u.write.cui_written += tot_bytes;
LASSERT(lsm);
lov_stripe_lock(lsm);
obd_adjust_kms(ll_i2dtexp(inode), lsm, file_offset, 0);
lov_stripe_unlock(lsm);
ccc_inode_lsm_put(inode, lsm);
}
} }
cl_env_put(env, &refcheck); cl_env_put(env, &refcheck);
return tot_bytes ? : result; return tot_bytes ? : result;
} }
/**
* Prepare partially written-to page for a write.
*/
static int ll_prepare_partial_page(const struct lu_env *env, struct cl_io *io,
struct cl_page *pg)
{
struct cl_object *obj = io->ci_obj;
struct cl_attr *attr = ccc_env_thread_attr(env);
loff_t offset = cl_offset(obj, pg->cp_index);
int result;
cl_object_attr_lock(obj);
result = cl_object_attr_get(env, obj, attr);
cl_object_attr_unlock(obj);
if (result == 0) {
struct ccc_page *cp;
cp = cl2ccc_page(cl_page_at(pg, &vvp_device_type));
/*
* If are writing to a new page, no need to read old data.
* The extent locking will have updated the KMS, and for our
* purposes here we can treat it like i_size.
*/
if (attr->cat_kms <= offset) {
char *kaddr = kmap_atomic(cp->cpg_page);
memset(kaddr, 0, cl_page_size(obj));
kunmap_atomic(kaddr);
} else if (cp->cpg_defer_uptodate) {
cp->cpg_ra_used = 1;
} else {
result = ll_page_sync_io(env, io, pg, CRT_READ);
}
}
return result;
}
static int ll_write_begin(struct file *file, struct address_space *mapping, static int ll_write_begin(struct file *file, struct address_space *mapping,
loff_t pos, unsigned len, unsigned flags, loff_t pos, unsigned len, unsigned flags,
struct page **pagep, void **fsdata) struct page **pagep, void **fsdata)
{ {
struct ll_cl_context *lcc;
struct lu_env *env;
struct cl_io *io;
struct cl_page *page;
struct cl_object *clob = ll_i2info(mapping->host)->lli_clob;
pgoff_t index = pos >> PAGE_CACHE_SHIFT; pgoff_t index = pos >> PAGE_CACHE_SHIFT;
struct page *page; struct page *vmpage = NULL;
int rc; unsigned int from = pos & (PAGE_CACHE_SIZE - 1);
unsigned from = pos & (PAGE_CACHE_SIZE - 1); unsigned int to = from + len;
int result = 0;
page = grab_cache_page_write_begin(mapping, index, flags); CDEBUG(D_VFSTRACE, "Writing %lu of %d to %d bytes\n", index, from, len);
if (!page)
return -ENOMEM; lcc = ll_cl_init(file, NULL);
if (IS_ERR(lcc)) {
result = PTR_ERR(lcc);
goto out;
}
env = lcc->lcc_env;
io = lcc->lcc_io;
/* To avoid deadlock, try to lock page first. */
vmpage = grab_cache_page_nowait(mapping, index);
if (unlikely(!vmpage || PageDirty(vmpage))) {
struct ccc_io *cio = ccc_env_io(env);
struct cl_page_list *plist = &cio->u.write.cui_queue;
/* if the page is already in dirty cache, we have to commit
* the pages right now; otherwise, it may cause deadlock
* because it holds page lock of a dirty page and request for
* more grants. It's okay for the dirty page to be the first
* one in commit page list, though.
*/
if (vmpage && PageDirty(vmpage) && plist->pl_nr > 0) {
unlock_page(vmpage);
page_cache_release(vmpage);
vmpage = NULL;
}
*pagep = page; /* commit pages and then wait for page lock */
result = vvp_io_write_commit(env, io);
if (result < 0)
goto out;
rc = ll_prepare_write(file, page, from, from + len); if (!vmpage) {
if (rc) { vmpage = grab_cache_page_write_begin(mapping, index,
unlock_page(page); flags);
page_cache_release(page); if (!vmpage) {
result = -ENOMEM;
goto out;
}
}
} }
return rc;
page = cl_page_find(env, clob, vmpage->index, vmpage, CPT_CACHEABLE);
if (IS_ERR(page)) {
result = PTR_ERR(page);
goto out;
}
lcc->lcc_page = page;
lu_ref_add(&page->cp_reference, "cl_io", io);
cl_page_assume(env, io, page);
if (!PageUptodate(vmpage)) {
/*
* We're completely overwriting an existing page,
* so _don't_ set it up to date until commit_write
*/
if (from == 0 && to == PAGE_SIZE) {
CL_PAGE_HEADER(D_PAGE, env, page, "full page write\n");
POISON_PAGE(vmpage, 0x11);
} else {
/* TODO: can be optimized at OSC layer to check if it
* is a lockless IO. In that case, it's not necessary
* to read the data.
*/
result = ll_prepare_partial_page(env, io, page);
if (result == 0)
SetPageUptodate(vmpage);
}
}
if (result < 0)
cl_page_unassume(env, io, page);
out:
if (result < 0) {
if (vmpage) {
unlock_page(vmpage);
page_cache_release(vmpage);
}
if (!IS_ERR(lcc))
ll_cl_fini(lcc);
} else {
*pagep = vmpage;
*fsdata = lcc;
}
return result;
} }
static int ll_write_end(struct file *file, struct address_space *mapping, static int ll_write_end(struct file *file, struct address_space *mapping,
loff_t pos, unsigned len, unsigned copied, loff_t pos, unsigned len, unsigned copied,
struct page *page, void *fsdata) struct page *vmpage, void *fsdata)
{ {
struct ll_cl_context *lcc = fsdata;
struct lu_env *env;
struct cl_io *io;
struct ccc_io *cio;
struct cl_page *page;
unsigned from = pos & (PAGE_CACHE_SIZE - 1); unsigned from = pos & (PAGE_CACHE_SIZE - 1);
int rc; bool unplug = false;
int result = 0;
page_cache_release(vmpage);
env = lcc->lcc_env;
page = lcc->lcc_page;
io = lcc->lcc_io;
cio = ccc_env_io(env);
LASSERT(cl_page_is_owned(page, io));
if (copied > 0) {
struct cl_page_list *plist = &cio->u.write.cui_queue;
lcc->lcc_page = NULL; /* page will be queued */
/* Add it into write queue */
cl_page_list_add(plist, page);
if (plist->pl_nr == 1) /* first page */
cio->u.write.cui_from = from;
else
LASSERT(from == 0);
cio->u.write.cui_to = from + copied;
/* We may have one full RPC, commit it soon */
if (plist->pl_nr >= PTLRPC_MAX_BRW_PAGES)
unplug = true;
CL_PAGE_DEBUG(D_VFSTRACE, env, page,
"queued page: %d.\n", plist->pl_nr);
} else {
cl_page_disown(env, io, page);
/* page list is not contiguous now, commit it now */
unplug = true;
}
rc = ll_commit_write(file, page, from, from + copied); if (unplug ||
unlock_page(page); file->f_flags & O_SYNC || IS_SYNC(file_inode(file)))
page_cache_release(page); result = vvp_io_write_commit(env, io);
return rc ?: copied; ll_cl_fini(lcc);
return result >= 0 ? copied : result;
} }
#ifdef CONFIG_MIGRATION #ifdef CONFIG_MIGRATION
......
...@@ -44,17 +44,15 @@ ...@@ -44,17 +44,15 @@
#include "../include/cl_object.h" #include "../include/cl_object.h"
#include "llite_internal.h" #include "llite_internal.h"
int vvp_io_init(const struct lu_env *env, int vvp_io_init(const struct lu_env *env, struct cl_object *obj,
struct cl_object *obj, struct cl_io *io); struct cl_io *io);
int vvp_lock_init(const struct lu_env *env, int vvp_lock_init(const struct lu_env *env, struct cl_object *obj,
struct cl_object *obj, struct cl_lock *lock, struct cl_lock *lock, const struct cl_io *io);
const struct cl_io *io);
int vvp_page_init(const struct lu_env *env, struct cl_object *obj, int vvp_page_init(const struct lu_env *env, struct cl_object *obj,
struct cl_page *page, struct page *vmpage); struct cl_page *page, struct page *vmpage);
struct lu_object *vvp_object_alloc(const struct lu_env *env, struct lu_object *vvp_object_alloc(const struct lu_env *env,
const struct lu_object_header *hdr, const struct lu_object_header *hdr,
struct lu_device *dev); struct lu_device *dev);
struct ccc_object *cl_inode2ccc(struct inode *inode); struct ccc_object *cl_inode2ccc(struct inode *inode);
extern const struct file_operations vvp_dump_pgcache_file_ops; extern const struct file_operations vvp_dump_pgcache_file_ops;
......
...@@ -444,8 +444,10 @@ struct lov_thread_info { ...@@ -444,8 +444,10 @@ struct lov_thread_info {
struct cl_lock_descr lti_ldescr; struct cl_lock_descr lti_ldescr;
struct ost_lvb lti_lvb; struct ost_lvb lti_lvb;
struct cl_2queue lti_cl2q; struct cl_2queue lti_cl2q;
struct cl_page_list lti_plist;
struct cl_lock_closure lti_closure; struct cl_lock_closure lti_closure;
wait_queue_t lti_waiter; wait_queue_t lti_waiter;
struct cl_attr lti_attr;
}; };
/** /**
......
...@@ -543,13 +543,6 @@ static void lov_io_unlock(const struct lu_env *env, ...@@ -543,13 +543,6 @@ static void lov_io_unlock(const struct lu_env *env,
LASSERT(rc == 0); LASSERT(rc == 0);
} }
static struct cl_page_list *lov_io_submit_qin(struct lov_device *ld,
struct cl_page_list *qin,
int idx, int alloc)
{
return alloc ? &qin[idx] : &ld->ld_emrg[idx]->emrg_page_list;
}
/** /**
* lov implementation of cl_operations::cio_submit() method. It takes a list * lov implementation of cl_operations::cio_submit() method. It takes a list
* of pages in \a queue, splits it into per-stripe sub-lists, invokes * of pages in \a queue, splits it into per-stripe sub-lists, invokes
...@@ -569,25 +562,17 @@ static int lov_io_submit(const struct lu_env *env, ...@@ -569,25 +562,17 @@ static int lov_io_submit(const struct lu_env *env,
const struct cl_io_slice *ios, const struct cl_io_slice *ios,
enum cl_req_type crt, struct cl_2queue *queue) enum cl_req_type crt, struct cl_2queue *queue)
{ {
struct lov_io *lio = cl2lov_io(env, ios); struct cl_page_list *qin = &queue->c2_qin;
struct lov_object *obj = lio->lis_object; struct lov_io *lio = cl2lov_io(env, ios);
struct lov_device *ld = lu2lov_dev(lov2cl(obj)->co_lu.lo_dev); struct lov_io_sub *sub;
struct cl_page_list *qin = &queue->c2_qin; struct cl_page_list *plist = &lov_env_info(env)->lti_plist;
struct cl_2queue *cl2q = &lov_env_info(env)->lti_cl2q;
struct cl_page_list *stripes_qin = NULL;
struct cl_page *page; struct cl_page *page;
struct cl_page *tmp;
int stripe; int stripe;
#define QIN(stripe) lov_io_submit_qin(ld, stripes_qin, stripe, alloc)
int rc = 0; int rc = 0;
int alloc =
!(current->flags & PF_MEMALLOC);
if (lio->lis_active_subios == 1) { if (lio->lis_active_subios == 1) {
int idx = lio->lis_single_subio_index; int idx = lio->lis_single_subio_index;
struct lov_io_sub *sub;
LASSERT(idx < lio->lis_nr_subios); LASSERT(idx < lio->lis_nr_subios);
sub = lov_sub_get(env, lio, idx); sub = lov_sub_get(env, lio, idx);
...@@ -600,119 +585,120 @@ static int lov_io_submit(const struct lu_env *env, ...@@ -600,119 +585,120 @@ static int lov_io_submit(const struct lu_env *env,
} }
LASSERT(lio->lis_subs); LASSERT(lio->lis_subs);
if (alloc) {
stripes_qin =
libcfs_kvzalloc(sizeof(*stripes_qin) *
lio->lis_nr_subios,
GFP_NOFS);
if (!stripes_qin)
return -ENOMEM;
for (stripe = 0; stripe < lio->lis_nr_subios; stripe++)
cl_page_list_init(&stripes_qin[stripe]);
} else {
/*
* If we get here, it means pageout & swap doesn't help.
* In order to not make things worse, even don't try to
* allocate the memory with __GFP_NOWARN. -jay
*/
mutex_lock(&ld->ld_mutex);
lio->lis_mem_frozen = 1;
}
cl_2queue_init(cl2q); cl_page_list_init(plist);
cl_page_list_for_each_safe(page, tmp, qin) { while (qin->pl_nr > 0) {
stripe = lov_page_stripe(page); struct cl_2queue *cl2q = &lov_env_info(env)->lti_cl2q;
cl_page_list_move(QIN(stripe), qin, page);
}
for (stripe = 0; stripe < lio->lis_nr_subios; stripe++) { cl_2queue_init(cl2q);
struct lov_io_sub *sub;
struct cl_page_list *sub_qin = QIN(stripe);
if (list_empty(&sub_qin->pl_pages)) page = cl_page_list_first(qin);
continue; cl_page_list_move(&cl2q->c2_qin, qin, page);
stripe = lov_page_stripe(page);
while (qin->pl_nr > 0) {
page = cl_page_list_first(qin);
if (stripe != lov_page_stripe(page))
break;
cl_page_list_move(&cl2q->c2_qin, qin, page);
}
cl_page_list_splice(sub_qin, &cl2q->c2_qin);
sub = lov_sub_get(env, lio, stripe); sub = lov_sub_get(env, lio, stripe);
if (!IS_ERR(sub)) { if (!IS_ERR(sub)) {
rc = cl_io_submit_rw(sub->sub_env, sub->sub_io, rc = cl_io_submit_rw(sub->sub_env, sub->sub_io,
crt, cl2q); crt, cl2q);
lov_sub_put(sub); lov_sub_put(sub);
} else } else {
rc = PTR_ERR(sub); rc = PTR_ERR(sub);
cl_page_list_splice(&cl2q->c2_qin, &queue->c2_qin); }
cl_page_list_splice(&cl2q->c2_qin, plist);
cl_page_list_splice(&cl2q->c2_qout, &queue->c2_qout); cl_page_list_splice(&cl2q->c2_qout, &queue->c2_qout);
cl_2queue_fini(env, cl2q);
if (rc != 0) if (rc != 0)
break; break;
} }
for (stripe = 0; stripe < lio->lis_nr_subios; stripe++) { cl_page_list_splice(plist, qin);
struct cl_page_list *sub_qin = QIN(stripe); cl_page_list_fini(env, plist);
if (list_empty(&sub_qin->pl_pages)) return rc;
continue; }
static int lov_io_commit_async(const struct lu_env *env,
const struct cl_io_slice *ios,
struct cl_page_list *queue, int from, int to,
cl_commit_cbt cb)
{
struct cl_page_list *plist = &lov_env_info(env)->lti_plist;
struct lov_io *lio = cl2lov_io(env, ios);
struct lov_io_sub *sub;
struct cl_page *page;
int rc = 0;
cl_page_list_splice(sub_qin, qin); if (lio->lis_active_subios == 1) {
int idx = lio->lis_single_subio_index;
LASSERT(idx < lio->lis_nr_subios);
sub = lov_sub_get(env, lio, idx);
LASSERT(!IS_ERR(sub));
LASSERT(sub->sub_io == &lio->lis_single_subio);
rc = cl_io_commit_async(sub->sub_env, sub->sub_io, queue,
from, to, cb);
lov_sub_put(sub);
return rc;
} }
if (alloc) { LASSERT(lio->lis_subs);
kvfree(stripes_qin);
} else {
int i;
for (i = 0; i < lio->lis_nr_subios; i++) { cl_page_list_init(plist);
struct cl_io *cio = lio->lis_subs[i].sub_io; while (queue->pl_nr > 0) {
int stripe_to = to;
int stripe;
if (cio && cio == &ld->ld_emrg[i]->emrg_subio) LASSERT(plist->pl_nr == 0);
lov_io_sub_fini(env, lio, &lio->lis_subs[i]); page = cl_page_list_first(queue);
cl_page_list_move(plist, queue, page);
stripe = lov_page_stripe(page);
while (queue->pl_nr > 0) {
page = cl_page_list_first(queue);
if (stripe != lov_page_stripe(page))
break;
cl_page_list_move(plist, queue, page);
} }
lio->lis_mem_frozen = 0;
mutex_unlock(&ld->ld_mutex);
}
return rc; if (queue->pl_nr > 0) /* still has more pages */
#undef QIN stripe_to = PAGE_SIZE;
}
static int lov_io_prepare_write(const struct lu_env *env, sub = lov_sub_get(env, lio, stripe);
const struct cl_io_slice *ios, if (!IS_ERR(sub)) {
const struct cl_page_slice *slice, rc = cl_io_commit_async(sub->sub_env, sub->sub_io,
unsigned from, unsigned to) plist, from, stripe_to, cb);
{ lov_sub_put(sub);
struct lov_io *lio = cl2lov_io(env, ios); } else {
struct cl_page *sub_page = lov_sub_page(slice); rc = PTR_ERR(sub);
struct lov_io_sub *sub; break;
int result; }
sub = lov_page_subio(env, lio, slice); if (plist->pl_nr > 0) /* short write */
if (!IS_ERR(sub)) { break;
result = cl_io_prepare_write(sub->sub_env, sub->sub_io,
sub_page, from, to);
lov_sub_put(sub);
} else
result = PTR_ERR(sub);
return result;
}
static int lov_io_commit_write(const struct lu_env *env, from = 0;
const struct cl_io_slice *ios, }
const struct cl_page_slice *slice,
unsigned from, unsigned to)
{
struct lov_io *lio = cl2lov_io(env, ios);
struct cl_page *sub_page = lov_sub_page(slice);
struct lov_io_sub *sub;
int result;
sub = lov_page_subio(env, lio, slice); /* for error case, add the page back into the qin list */
if (!IS_ERR(sub)) { LASSERT(ergo(rc == 0, plist->pl_nr == 0));
result = cl_io_commit_write(sub->sub_env, sub->sub_io, while (plist->pl_nr > 0) {
sub_page, from, to); /* error occurred, add the uncommitted pages back into queue */
lov_sub_put(sub); page = cl_page_list_last(plist);
} else cl_page_list_move_head(queue, plist, page);
result = PTR_ERR(sub); }
return result;
return rc;
} }
static int lov_io_fault_start(const struct lu_env *env, static int lov_io_fault_start(const struct lu_env *env,
...@@ -803,16 +789,8 @@ static const struct cl_io_operations lov_io_ops = { ...@@ -803,16 +789,8 @@ static const struct cl_io_operations lov_io_ops = {
.cio_fini = lov_io_fini .cio_fini = lov_io_fini
} }
}, },
.req_op = { .cio_submit = lov_io_submit,
[CRT_READ] = { .cio_commit_async = lov_io_commit_async,
.cio_submit = lov_io_submit
},
[CRT_WRITE] = {
.cio_submit = lov_io_submit
}
},
.cio_prepare_write = lov_io_prepare_write,
.cio_commit_write = lov_io_commit_write
}; };
/***************************************************************************** /*****************************************************************************
...@@ -880,15 +858,8 @@ static const struct cl_io_operations lov_empty_io_ops = { ...@@ -880,15 +858,8 @@ static const struct cl_io_operations lov_empty_io_ops = {
.cio_fini = lov_empty_io_fini .cio_fini = lov_empty_io_fini
} }
}, },
.req_op = { .cio_submit = LOV_EMPTY_IMPOSSIBLE,
[CRT_READ] = { .cio_commit_async = LOV_EMPTY_IMPOSSIBLE
.cio_submit = LOV_EMPTY_IMPOSSIBLE
},
[CRT_WRITE] = {
.cio_submit = LOV_EMPTY_IMPOSSIBLE
}
},
.cio_commit_write = LOV_EMPTY_IMPOSSIBLE
}; };
int lov_io_init_raid0(const struct lu_env *env, struct cl_object *obj, int lov_io_init_raid0(const struct lu_env *env, struct cl_object *obj,
......
...@@ -105,29 +105,6 @@ static void lov_page_assume(const struct lu_env *env, ...@@ -105,29 +105,6 @@ static void lov_page_assume(const struct lu_env *env,
lov_page_own(env, slice, io, 0); lov_page_own(env, slice, io, 0);
} }
static int lov_page_cache_add(const struct lu_env *env,
const struct cl_page_slice *slice,
struct cl_io *io)
{
struct lov_io *lio = lov_env_io(env);
struct lov_io_sub *sub;
int rc = 0;
LINVRNT(lov_page_invariant(slice));
LINVRNT(!cl2lov_page(slice)->lps_invalid);
sub = lov_page_subio(env, lio, slice);
if (!IS_ERR(sub)) {
rc = cl_page_cache_add(sub->sub_env, sub->sub_io,
slice->cpl_page->cp_child, CRT_WRITE);
lov_sub_put(sub);
} else {
rc = PTR_ERR(sub);
CL_PAGE_DEBUG(D_ERROR, env, slice->cpl_page, "rc = %d\n", rc);
}
return rc;
}
static int lov_page_print(const struct lu_env *env, static int lov_page_print(const struct lu_env *env,
const struct cl_page_slice *slice, const struct cl_page_slice *slice,
void *cookie, lu_printer_t printer) void *cookie, lu_printer_t printer)
...@@ -141,11 +118,6 @@ static const struct cl_page_operations lov_page_ops = { ...@@ -141,11 +118,6 @@ static const struct cl_page_operations lov_page_ops = {
.cpo_fini = lov_page_fini, .cpo_fini = lov_page_fini,
.cpo_own = lov_page_own, .cpo_own = lov_page_own,
.cpo_assume = lov_page_assume, .cpo_assume = lov_page_assume,
.io = {
[CRT_WRITE] = {
.cpo_cache_add = lov_page_cache_add
}
},
.cpo_print = lov_page_print .cpo_print = lov_page_print
}; };
......
...@@ -782,77 +782,29 @@ int cl_io_read_page(const struct lu_env *env, struct cl_io *io, ...@@ -782,77 +782,29 @@ int cl_io_read_page(const struct lu_env *env, struct cl_io *io,
EXPORT_SYMBOL(cl_io_read_page); EXPORT_SYMBOL(cl_io_read_page);
/** /**
* Called by write io to prepare page to receive data from user buffer. * Commit a list of contiguous pages into writeback cache.
* *
* \see cl_io_operations::cio_prepare_write() * \returns 0 if all pages committed, or errcode if error occurred.
* \see cl_io_operations::cio_commit_async()
*/ */
int cl_io_prepare_write(const struct lu_env *env, struct cl_io *io, int cl_io_commit_async(const struct lu_env *env, struct cl_io *io,
struct cl_page *page, unsigned from, unsigned to) struct cl_page_list *queue, int from, int to,
cl_commit_cbt cb)
{ {
const struct cl_io_slice *scan; const struct cl_io_slice *scan;
int result = 0; int result = 0;
LINVRNT(io->ci_type == CIT_WRITE);
LINVRNT(cl_page_is_owned(page, io));
LINVRNT(io->ci_state == CIS_IO_GOING || io->ci_state == CIS_LOCKED);
LINVRNT(cl_io_invariant(io));
LASSERT(cl_page_in_io(page, io));
cl_io_for_each_reverse(scan, io) {
if (scan->cis_iop->cio_prepare_write) {
const struct cl_page_slice *slice;
slice = cl_io_slice_page(scan, page);
result = scan->cis_iop->cio_prepare_write(env, scan,
slice,
from, to);
if (result != 0)
break;
}
}
return result;
}
EXPORT_SYMBOL(cl_io_prepare_write);
/**
* Called by write io after user data were copied into a page.
*
* \see cl_io_operations::cio_commit_write()
*/
int cl_io_commit_write(const struct lu_env *env, struct cl_io *io,
struct cl_page *page, unsigned from, unsigned to)
{
const struct cl_io_slice *scan;
int result = 0;
LINVRNT(io->ci_type == CIT_WRITE);
LINVRNT(io->ci_state == CIS_IO_GOING || io->ci_state == CIS_LOCKED);
LINVRNT(cl_io_invariant(io));
/*
* XXX Uh... not nice. Top level cl_io_commit_write() call (vvp->lov)
* already called cl_page_cache_add(), moving page into CPS_CACHED
* state. Better (and more general) way of dealing with such situation
* is needed.
*/
LASSERT(cl_page_is_owned(page, io) || page->cp_parent);
LASSERT(cl_page_in_io(page, io));
cl_io_for_each(scan, io) { cl_io_for_each(scan, io) {
if (scan->cis_iop->cio_commit_write) { if (!scan->cis_iop->cio_commit_async)
const struct cl_page_slice *slice; continue;
result = scan->cis_iop->cio_commit_async(env, scan, queue,
slice = cl_io_slice_page(scan, page); from, to, cb);
result = scan->cis_iop->cio_commit_write(env, scan, if (result != 0)
slice, break;
from, to);
if (result != 0)
break;
}
} }
LINVRNT(result <= 0);
return result; return result;
} }
EXPORT_SYMBOL(cl_io_commit_write); EXPORT_SYMBOL(cl_io_commit_async);
/** /**
* Submits a list of pages for immediate io. * Submits a list of pages for immediate io.
...@@ -870,13 +822,10 @@ int cl_io_submit_rw(const struct lu_env *env, struct cl_io *io, ...@@ -870,13 +822,10 @@ int cl_io_submit_rw(const struct lu_env *env, struct cl_io *io,
const struct cl_io_slice *scan; const struct cl_io_slice *scan;
int result = 0; int result = 0;
LINVRNT(crt < ARRAY_SIZE(scan->cis_iop->req_op));
cl_io_for_each(scan, io) { cl_io_for_each(scan, io) {
if (!scan->cis_iop->req_op[crt].cio_submit) if (!scan->cis_iop->cio_submit)
continue; continue;
result = scan->cis_iop->req_op[crt].cio_submit(env, scan, crt, result = scan->cis_iop->cio_submit(env, scan, crt, queue);
queue);
if (result != 0) if (result != 0)
break; break;
} }
...@@ -1073,8 +1022,8 @@ EXPORT_SYMBOL(cl_page_list_add); ...@@ -1073,8 +1022,8 @@ EXPORT_SYMBOL(cl_page_list_add);
/** /**
* Removes a page from a page list. * Removes a page from a page list.
*/ */
static void cl_page_list_del(const struct lu_env *env, void cl_page_list_del(const struct lu_env *env, struct cl_page_list *plist,
struct cl_page_list *plist, struct cl_page *page) struct cl_page *page)
{ {
LASSERT(plist->pl_nr > 0); LASSERT(plist->pl_nr > 0);
LINVRNT(plist->pl_owner == current); LINVRNT(plist->pl_owner == current);
...@@ -1087,6 +1036,7 @@ static void cl_page_list_del(const struct lu_env *env, ...@@ -1087,6 +1036,7 @@ static void cl_page_list_del(const struct lu_env *env,
lu_ref_del_at(&page->cp_reference, &page->cp_queue_ref, "queue", plist); lu_ref_del_at(&page->cp_reference, &page->cp_queue_ref, "queue", plist);
cl_page_put(env, page); cl_page_put(env, page);
} }
EXPORT_SYMBOL(cl_page_list_del);
/** /**
* Moves a page from one page list to another. * Moves a page from one page list to another.
...@@ -1106,6 +1056,24 @@ void cl_page_list_move(struct cl_page_list *dst, struct cl_page_list *src, ...@@ -1106,6 +1056,24 @@ void cl_page_list_move(struct cl_page_list *dst, struct cl_page_list *src,
} }
EXPORT_SYMBOL(cl_page_list_move); EXPORT_SYMBOL(cl_page_list_move);
/**
* Moves a page from one page list to the head of another list.
*/
void cl_page_list_move_head(struct cl_page_list *dst, struct cl_page_list *src,
struct cl_page *page)
{
LASSERT(src->pl_nr > 0);
LINVRNT(dst->pl_owner == current);
LINVRNT(src->pl_owner == current);
list_move(&page->cp_batch, &dst->pl_pages);
--src->pl_nr;
++dst->pl_nr;
lu_ref_set_at(&page->cp_reference, &page->cp_queue_ref, "queue",
src, dst);
}
EXPORT_SYMBOL(cl_page_list_move_head);
/** /**
* splice the cl_page_list, just as list head does * splice the cl_page_list, just as list head does
*/ */
...@@ -1163,8 +1131,7 @@ EXPORT_SYMBOL(cl_page_list_disown); ...@@ -1163,8 +1131,7 @@ EXPORT_SYMBOL(cl_page_list_disown);
/** /**
* Releases pages from queue. * Releases pages from queue.
*/ */
static void cl_page_list_fini(const struct lu_env *env, void cl_page_list_fini(const struct lu_env *env, struct cl_page_list *plist)
struct cl_page_list *plist)
{ {
struct cl_page *page; struct cl_page *page;
struct cl_page *temp; struct cl_page *temp;
...@@ -1175,6 +1142,7 @@ static void cl_page_list_fini(const struct lu_env *env, ...@@ -1175,6 +1142,7 @@ static void cl_page_list_fini(const struct lu_env *env,
cl_page_list_del(env, plist, page); cl_page_list_del(env, plist, page);
LASSERT(plist->pl_nr == 0); LASSERT(plist->pl_nr == 0);
} }
EXPORT_SYMBOL(cl_page_list_fini);
/** /**
* Assumes all pages in a queue. * Assumes all pages in a queue.
......
...@@ -1011,44 +1011,6 @@ int cl_page_make_ready(const struct lu_env *env, struct cl_page *pg, ...@@ -1011,44 +1011,6 @@ int cl_page_make_ready(const struct lu_env *env, struct cl_page *pg,
} }
EXPORT_SYMBOL(cl_page_make_ready); EXPORT_SYMBOL(cl_page_make_ready);
/**
* Notify layers that high level io decided to place this page into a cache
* for future transfer.
*
* The layer implementing transfer engine (osc) has to register this page in
* its queues.
*
* \pre cl_page_is_owned(pg, io)
* \post cl_page_is_owned(pg, io)
*
* \see cl_page_operations::cpo_cache_add()
*/
int cl_page_cache_add(const struct lu_env *env, struct cl_io *io,
struct cl_page *pg, enum cl_req_type crt)
{
const struct cl_page_slice *scan;
int result = 0;
PINVRNT(env, pg, crt < CRT_NR);
PINVRNT(env, pg, cl_page_is_owned(pg, io));
PINVRNT(env, pg, cl_page_invariant(pg));
if (crt >= CRT_NR)
return -EINVAL;
list_for_each_entry(scan, &pg->cp_layers, cpl_linkage) {
if (!scan->cpl_ops->io[crt].cpo_cache_add)
continue;
result = scan->cpl_ops->io[crt].cpo_cache_add(env, scan, io);
if (result != 0)
break;
}
CL_PAGE_HEADER(D_TRACE, env, pg, "%d %d\n", crt, result);
return result;
}
EXPORT_SYMBOL(cl_page_cache_add);
/** /**
* Called if a pge is being written back by kernel's intention. * Called if a pge is being written back by kernel's intention.
* *
......
...@@ -1085,22 +1085,17 @@ static int cl_echo_cancel0(struct lu_env *env, struct echo_device *ed, ...@@ -1085,22 +1085,17 @@ static int cl_echo_cancel0(struct lu_env *env, struct echo_device *ed,
return 0; return 0;
} }
static int cl_echo_async_brw(const struct lu_env *env, struct cl_io *io, static void echo_commit_callback(const struct lu_env *env, struct cl_io *io,
enum cl_req_type unused, struct cl_2queue *queue) struct cl_page *page)
{ {
struct cl_page *clp; struct echo_thread_info *info;
struct cl_page *temp; struct cl_2queue *queue;
int result = 0;
cl_page_list_for_each_safe(clp, temp, &queue->c2_qin) { info = echo_env_info(env);
int rc; LASSERT(io == &info->eti_io);
rc = cl_page_cache_add(env, io, clp, CRT_WRITE); queue = &info->eti_queue;
if (rc == 0) cl_page_list_add(&queue->c2_qout, page);
continue;
result = result ?: rc;
}
return result;
} }
static int cl_echo_object_brw(struct echo_object *eco, int rw, u64 offset, static int cl_echo_object_brw(struct echo_object *eco, int rw, u64 offset,
...@@ -1179,7 +1174,9 @@ static int cl_echo_object_brw(struct echo_object *eco, int rw, u64 offset, ...@@ -1179,7 +1174,9 @@ static int cl_echo_object_brw(struct echo_object *eco, int rw, u64 offset,
async = async && (typ == CRT_WRITE); async = async && (typ == CRT_WRITE);
if (async) if (async)
rc = cl_echo_async_brw(env, io, typ, queue); rc = cl_io_commit_async(env, io, &queue->c2_qin,
0, PAGE_SIZE,
echo_commit_callback);
else else
rc = cl_io_submit_sync(env, io, typ, queue, 0); rc = cl_io_submit_sync(env, io, typ, queue, 0);
CDEBUG(D_INFO, "echo_client %s write returns %d\n", CDEBUG(D_INFO, "echo_client %s write returns %d\n",
......
...@@ -879,10 +879,9 @@ int osc_extent_finish(const struct lu_env *env, struct osc_extent *ext, ...@@ -879,10 +879,9 @@ int osc_extent_finish(const struct lu_env *env, struct osc_extent *ext,
* span a whole chunk on the OST side, or our accounting goes * span a whole chunk on the OST side, or our accounting goes
* wrong. Should match the code in filter_grant_check. * wrong. Should match the code in filter_grant_check.
*/ */
int offset = oap->oap_page_off & ~PAGE_MASK; int offset = last_off & ~PAGE_MASK;
int count = oap->oap_count + (offset & (blocksize - 1)); int count = last_count + (offset & (blocksize - 1));
int end = (offset + oap->oap_count) & (blocksize - 1); int end = (offset + last_count) & (blocksize - 1);
if (end) if (end)
count += blocksize - end; count += blocksize - end;
...@@ -3131,14 +3130,13 @@ static int discard_cb(const struct lu_env *env, struct cl_io *io, ...@@ -3131,14 +3130,13 @@ static int discard_cb(const struct lu_env *env, struct cl_io *io,
struct cl_page *page = cl_page_top(ops->ops_cl.cpl_page); struct cl_page *page = cl_page_top(ops->ops_cl.cpl_page);
LASSERT(lock->cll_descr.cld_mode >= CLM_WRITE); LASSERT(lock->cll_descr.cld_mode >= CLM_WRITE);
KLASSERT(ergo(page->cp_type == CPT_CACHEABLE,
!PageWriteback(cl_page_vmpage(env, page))));
KLASSERT(ergo(page->cp_type == CPT_CACHEABLE,
!PageDirty(cl_page_vmpage(env, page))));
/* page is top page. */ /* page is top page. */
info->oti_next_index = osc_index(ops) + 1; info->oti_next_index = osc_index(ops) + 1;
if (cl_page_own(env, io, page) == 0) { if (cl_page_own(env, io, page) == 0) {
KLASSERT(ergo(page->cp_type == CPT_CACHEABLE,
!PageDirty(cl_page_vmpage(env, page))));
/* discard the page */ /* discard the page */
cl_page_discard(env, io, page); cl_page_discard(env, io, page);
cl_page_disown(env, io, page); cl_page_disown(env, io, page);
......
...@@ -453,6 +453,8 @@ int osc_prep_async_page(struct osc_object *osc, struct osc_page *ops, ...@@ -453,6 +453,8 @@ int osc_prep_async_page(struct osc_object *osc, struct osc_page *ops,
struct page *page, loff_t offset); struct page *page, loff_t offset);
int osc_queue_async_io(const struct lu_env *env, struct cl_io *io, int osc_queue_async_io(const struct lu_env *env, struct cl_io *io,
struct osc_page *ops); struct osc_page *ops);
int osc_page_cache_add(const struct lu_env *env,
const struct cl_page_slice *slice, struct cl_io *io);
int osc_teardown_async_page(const struct lu_env *env, struct osc_object *obj, int osc_teardown_async_page(const struct lu_env *env, struct osc_object *obj,
struct osc_page *ops); struct osc_page *ops);
int osc_flush_async_page(const struct lu_env *env, struct cl_io *io, int osc_flush_async_page(const struct lu_env *env, struct cl_io *io,
......
...@@ -83,6 +83,12 @@ struct osc_async_page { ...@@ -83,6 +83,12 @@ struct osc_async_page {
#define oap_count oap_brw_page.count #define oap_count oap_brw_page.count
#define oap_brw_flags oap_brw_page.flag #define oap_brw_flags oap_brw_page.flag
static inline struct osc_async_page *brw_page2oap(struct brw_page *pga)
{
return (struct osc_async_page *)container_of(pga, struct osc_async_page,
oap_brw_page);
}
struct osc_cache_waiter { struct osc_cache_waiter {
struct list_head ocw_entry; struct list_head ocw_entry;
wait_queue_head_t ocw_waitq; wait_queue_head_t ocw_waitq;
......
...@@ -185,6 +185,13 @@ static int osc_io_submit(const struct lu_env *env, ...@@ -185,6 +185,13 @@ static int osc_io_submit(const struct lu_env *env,
return qout->pl_nr > 0 ? 0 : result; return qout->pl_nr > 0 ? 0 : result;
} }
/**
* This is called when a page is accessed within file in a way that creates
* new page, if one were missing (i.e., if there were a hole at that place in
* the file, or accessed page is beyond the current file size).
*
* Expand stripe KMS if necessary.
*/
static void osc_page_touch_at(const struct lu_env *env, static void osc_page_touch_at(const struct lu_env *env,
struct cl_object *obj, pgoff_t idx, unsigned to) struct cl_object *obj, pgoff_t idx, unsigned to)
{ {
...@@ -208,7 +215,8 @@ static void osc_page_touch_at(const struct lu_env *env, ...@@ -208,7 +215,8 @@ static void osc_page_touch_at(const struct lu_env *env,
kms > loi->loi_kms ? "" : "not ", loi->loi_kms, kms, kms > loi->loi_kms ? "" : "not ", loi->loi_kms, kms,
loi->loi_lvb.lvb_size); loi->loi_lvb.lvb_size);
valid = 0; attr->cat_mtime = attr->cat_ctime = LTIME_S(CURRENT_TIME);
valid = CAT_MTIME | CAT_CTIME;
if (kms > loi->loi_kms) { if (kms > loi->loi_kms) {
attr->cat_kms = kms; attr->cat_kms = kms;
valid |= CAT_KMS; valid |= CAT_KMS;
...@@ -221,91 +229,83 @@ static void osc_page_touch_at(const struct lu_env *env, ...@@ -221,91 +229,83 @@ static void osc_page_touch_at(const struct lu_env *env,
cl_object_attr_unlock(obj); cl_object_attr_unlock(obj);
} }
/** static int osc_io_commit_async(const struct lu_env *env,
* This is called when a page is accessed within file in a way that creates const struct cl_io_slice *ios,
* new page, if one were missing (i.e., if there were a hole at that place in struct cl_page_list *qin, int from, int to,
* the file, or accessed page is beyond the current file size). Examples: cl_commit_cbt cb)
* ->commit_write() and ->nopage() methods.
*
* Expand stripe KMS if necessary.
*/
static void osc_page_touch(const struct lu_env *env,
struct osc_page *opage, unsigned to)
{
struct cl_page *page = opage->ops_cl.cpl_page;
struct cl_object *obj = opage->ops_cl.cpl_obj;
osc_page_touch_at(env, obj, page->cp_index, to);
}
/**
* Implements cl_io_operations::cio_prepare_write() method for osc layer.
*
* \retval -EIO transfer initiated against this osc will most likely fail
* \retval 0 transfer initiated against this osc will most likely succeed.
*
* The reason for this check is to immediately return an error to the caller
* in the case of a deactivated import. Note, that import can be deactivated
* later, while pages, dirtied by this IO, are still in the cache, but this is
* irrelevant, because that would still return an error to the application (if
* it does fsync), but many applications don't do fsync because of performance
* issues, and we wanted to return an -EIO at write time to notify the
* application.
*/
static int osc_io_prepare_write(const struct lu_env *env,
const struct cl_io_slice *ios,
const struct cl_page_slice *slice,
unsigned from, unsigned to)
{ {
struct osc_device *dev = lu2osc_dev(slice->cpl_obj->co_lu.lo_dev); struct cl_io *io = ios->cis_io;
struct obd_import *imp = class_exp2cliimp(dev->od_exp);
struct osc_io *oio = cl2osc_io(env, ios); struct osc_io *oio = cl2osc_io(env, ios);
struct osc_object *osc = cl2osc(ios->cis_obj);
struct cl_page *page;
struct cl_page *last_page;
struct osc_page *opg;
int result = 0; int result = 0;
LASSERT(qin->pl_nr > 0);
/* Handle partial page cases */
last_page = cl_page_list_last(qin);
if (oio->oi_lockless) {
page = cl_page_list_first(qin);
if (page == last_page) {
cl_page_clip(env, page, from, to);
} else {
if (from != 0)
cl_page_clip(env, page, from, PAGE_SIZE);
if (to != PAGE_SIZE)
cl_page_clip(env, last_page, 0, to);
}
}
/* /*
* This implements OBD_BRW_CHECK logic from old client. * NOTE: here @page is a top-level page. This is done to avoid
* creation of sub-page-list.
*/ */
while (qin->pl_nr > 0) {
struct osc_async_page *oap;
if (!imp || imp->imp_invalid) page = cl_page_list_first(qin);
result = -EIO; opg = osc_cl_page_osc(page);
if (result == 0 && oio->oi_lockless) oap = &opg->ops_oap;
/* this page contains `invalid' data, but who cares?
* nobody can access the invalid data.
* in osc_io_commit_write(), we're going to write exact
* [from, to) bytes of this page to OST. -jay
*/
cl_page_export(env, slice->cpl_page, 1);
return result; if (!list_empty(&oap->oap_rpc_item)) {
} CDEBUG(D_CACHE, "Busy oap %p page %p for submit.\n",
oap, opg);
result = -EBUSY;
break;
}
static int osc_io_commit_write(const struct lu_env *env, /* The page may be already in dirty cache. */
const struct cl_io_slice *ios, if (list_empty(&oap->oap_pending_item)) {
const struct cl_page_slice *slice, result = osc_page_cache_add(env, &opg->ops_cl, io);
unsigned from, unsigned to) if (result != 0)
{ break;
struct osc_io *oio = cl2osc_io(env, ios); }
struct osc_page *opg = cl2osc_page(slice);
struct osc_object *obj = cl2osc(opg->ops_cl.cpl_obj);
struct osc_async_page *oap = &opg->ops_oap;
LASSERT(to > 0); osc_page_touch_at(env, osc2cl(osc),
/* opg->ops_cl.cpl_page->cp_index,
* XXX instead of calling osc_page_touch() here and in page == last_page ? to : PAGE_SIZE);
* osc_io_fault_start() it might be more logical to introduce
* cl_page_touch() method, that generic cl_io_commit_write() and page
* fault code calls.
*/
osc_page_touch(env, cl2osc_page(slice), to);
if (!client_is_remote(osc_export(obj)) &&
capable(CFS_CAP_SYS_RESOURCE))
oap->oap_brw_flags |= OBD_BRW_NOQUOTA;
if (oio->oi_lockless) cl_page_list_del(env, qin, page);
/* see osc_io_prepare_write() for lockless io handling. */
cl_page_clip(env, slice->cpl_page, from, to);
return 0; (*cb)(env, io, page);
/* Can't access page any more. Page can be in transfer and
* complete at any time.
*/
}
/* for sync write, kernel will wait for this page to be flushed before
* osc_io_end() is called, so release it earlier.
* for mkwrite(), it's known there is no further pages.
*/
if (cl_io_is_sync_write(io) && oio->oi_active) {
osc_extent_release(env, oio->oi_active);
oio->oi_active = NULL;
}
CDEBUG(D_INFO, "%d %d\n", qin->pl_nr, result);
return result;
} }
static int osc_io_rw_iter_init(const struct lu_env *env, static int osc_io_rw_iter_init(const struct lu_env *env,
...@@ -719,16 +719,8 @@ static const struct cl_io_operations osc_io_ops = { ...@@ -719,16 +719,8 @@ static const struct cl_io_operations osc_io_ops = {
.cio_fini = osc_io_fini .cio_fini = osc_io_fini
} }
}, },
.req_op = { .cio_submit = osc_io_submit,
[CRT_READ] = { .cio_commit_async = osc_io_commit_async
.cio_submit = osc_io_submit
},
[CRT_WRITE] = {
.cio_submit = osc_io_submit
}
},
.cio_prepare_write = osc_io_prepare_write,
.cio_commit_write = osc_io_commit_write
}; };
/***************************************************************************** /*****************************************************************************
......
...@@ -89,8 +89,8 @@ static void osc_page_transfer_put(const struct lu_env *env, ...@@ -89,8 +89,8 @@ static void osc_page_transfer_put(const struct lu_env *env,
struct cl_page *page = cl_page_top(opg->ops_cl.cpl_page); struct cl_page *page = cl_page_top(opg->ops_cl.cpl_page);
if (opg->ops_transfer_pinned) { if (opg->ops_transfer_pinned) {
lu_ref_del(&page->cp_reference, "transfer", page);
opg->ops_transfer_pinned = 0; opg->ops_transfer_pinned = 0;
lu_ref_del(&page->cp_reference, "transfer", page);
cl_page_put(env, page); cl_page_put(env, page);
} }
} }
...@@ -113,11 +113,9 @@ static void osc_page_transfer_add(const struct lu_env *env, ...@@ -113,11 +113,9 @@ static void osc_page_transfer_add(const struct lu_env *env,
spin_unlock(&obj->oo_seatbelt); spin_unlock(&obj->oo_seatbelt);
} }
static int osc_page_cache_add(const struct lu_env *env, int osc_page_cache_add(const struct lu_env *env,
const struct cl_page_slice *slice, const struct cl_page_slice *slice, struct cl_io *io)
struct cl_io *io)
{ {
struct osc_io *oio = osc_env_io(env);
struct osc_page *opg = cl2osc_page(slice); struct osc_page *opg = cl2osc_page(slice);
int result; int result;
...@@ -130,17 +128,6 @@ static int osc_page_cache_add(const struct lu_env *env, ...@@ -130,17 +128,6 @@ static int osc_page_cache_add(const struct lu_env *env,
else else
osc_page_transfer_add(env, opg, CRT_WRITE); osc_page_transfer_add(env, opg, CRT_WRITE);
/* for sync write, kernel will wait for this page to be flushed before
* osc_io_end() is called, so release it earlier.
* for mkwrite(), it's known there is no further pages.
*/
if (cl_io_is_sync_write(io) || cl_io_is_mkwrite(io)) {
if (oio->oi_active) {
osc_extent_release(env, oio->oi_active);
oio->oi_active = NULL;
}
}
return result; return result;
} }
...@@ -231,17 +218,6 @@ static void osc_page_completion_write(const struct lu_env *env, ...@@ -231,17 +218,6 @@ static void osc_page_completion_write(const struct lu_env *env,
{ {
} }
static int osc_page_fail(const struct lu_env *env,
const struct cl_page_slice *slice,
struct cl_io *unused)
{
/*
* Cached read?
*/
LBUG();
return 0;
}
static const char *osc_list(struct list_head *head) static const char *osc_list(struct list_head *head)
{ {
return list_empty(head) ? "-" : "+"; return list_empty(head) ? "-" : "+";
...@@ -393,11 +369,9 @@ static const struct cl_page_operations osc_page_ops = { ...@@ -393,11 +369,9 @@ static const struct cl_page_operations osc_page_ops = {
.cpo_disown = osc_page_disown, .cpo_disown = osc_page_disown,
.io = { .io = {
[CRT_READ] = { [CRT_READ] = {
.cpo_cache_add = osc_page_fail,
.cpo_completion = osc_page_completion_read .cpo_completion = osc_page_completion_read
}, },
[CRT_WRITE] = { [CRT_WRITE] = {
.cpo_cache_add = osc_page_cache_add,
.cpo_completion = osc_page_completion_write .cpo_completion = osc_page_completion_write
} }
}, },
......
...@@ -1734,7 +1734,6 @@ static int brw_interpret(const struct lu_env *env, ...@@ -1734,7 +1734,6 @@ static int brw_interpret(const struct lu_env *env,
struct osc_brw_async_args *aa = data; struct osc_brw_async_args *aa = data;
struct osc_extent *ext; struct osc_extent *ext;
struct osc_extent *tmp; struct osc_extent *tmp;
struct cl_object *obj = NULL;
struct client_obd *cli = aa->aa_cli; struct client_obd *cli = aa->aa_cli;
rc = osc_brw_fini_request(req, rc); rc = osc_brw_fini_request(req, rc);
...@@ -1763,24 +1762,17 @@ static int brw_interpret(const struct lu_env *env, ...@@ -1763,24 +1762,17 @@ static int brw_interpret(const struct lu_env *env,
rc = -EIO; rc = -EIO;
} }
list_for_each_entry_safe(ext, tmp, &aa->aa_exts, oe_link) { if (rc == 0) {
if (!obj && rc == 0) {
obj = osc2cl(ext->oe_obj);
cl_object_get(obj);
}
list_del_init(&ext->oe_link);
osc_extent_finish(env, ext, 1, rc);
}
LASSERT(list_empty(&aa->aa_exts));
LASSERT(list_empty(&aa->aa_oaps));
if (obj) {
struct obdo *oa = aa->aa_oa; struct obdo *oa = aa->aa_oa;
struct cl_attr *attr = &osc_env_info(env)->oti_attr; struct cl_attr *attr = &osc_env_info(env)->oti_attr;
unsigned long valid = 0; unsigned long valid = 0;
struct cl_object *obj;
struct osc_async_page *last;
last = brw_page2oap(aa->aa_ppga[aa->aa_page_count - 1]);
obj = osc2cl(last->oap_obj);
LASSERT(rc == 0); cl_object_attr_lock(obj);
if (oa->o_valid & OBD_MD_FLBLOCKS) { if (oa->o_valid & OBD_MD_FLBLOCKS) {
attr->cat_blocks = oa->o_blocks; attr->cat_blocks = oa->o_blocks;
valid |= CAT_BLOCKS; valid |= CAT_BLOCKS;
...@@ -1797,15 +1789,39 @@ static int brw_interpret(const struct lu_env *env, ...@@ -1797,15 +1789,39 @@ static int brw_interpret(const struct lu_env *env,
attr->cat_ctime = oa->o_ctime; attr->cat_ctime = oa->o_ctime;
valid |= CAT_CTIME; valid |= CAT_CTIME;
} }
if (valid != 0) {
cl_object_attr_lock(obj); if (lustre_msg_get_opc(req->rq_reqmsg) == OST_WRITE) {
cl_object_attr_set(env, obj, attr, valid); struct lov_oinfo *loi = cl2osc(obj)->oo_oinfo;
cl_object_attr_unlock(obj); loff_t last_off = last->oap_count + last->oap_obj_off;
/* Change file size if this is an out of quota or
* direct IO write and it extends the file size
*/
if (loi->loi_lvb.lvb_size < last_off) {
attr->cat_size = last_off;
valid |= CAT_SIZE;
}
/* Extend KMS if it's not a lockless write */
if (loi->loi_kms < last_off &&
oap2osc_page(last)->ops_srvlock == 0) {
attr->cat_kms = last_off;
valid |= CAT_KMS;
}
} }
cl_object_put(env, obj);
if (valid != 0)
cl_object_attr_set(env, obj, attr, valid);
cl_object_attr_unlock(obj);
} }
kmem_cache_free(obdo_cachep, aa->aa_oa); kmem_cache_free(obdo_cachep, aa->aa_oa);
list_for_each_entry_safe(ext, tmp, &aa->aa_exts, oe_link) {
list_del_init(&ext->oe_link);
osc_extent_finish(env, ext, 1, rc);
}
LASSERT(list_empty(&aa->aa_exts));
LASSERT(list_empty(&aa->aa_oaps));
cl_req_completion(env, aa->aa_clerq, rc < 0 ? rc : cl_req_completion(env, aa->aa_clerq, rc < 0 ? rc :
req->rq_bulk->bd_nob_transferred); req->rq_bulk->bd_nob_transferred);
osc_release_ppga(aa->aa_ppga, aa->aa_page_count); osc_release_ppga(aa->aa_ppga, aa->aa_page_count);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment