Commit 766c8ceb authored by Javier González, committed by Jens Axboe

lightnvm: pblk: guarantee that backpointer is respected on writer stall

pblk's write buffer must guarantee that it respects the device's
constraints for reads (i.e., mw_cunits). This is done by maintaining a
backpointer that updates the L2P table as entries wrap up, making them
point to the media instead of pointing to the write buffer.

This mechanism can race if the write thread stalls, as the
write pointer will protect the last written entry, thus disregarding the
read constraints.

This patch adds an extra check on wrap up, making sure that the
threshold is respected at all times and preventing new entries from
overwriting committed data, even if the write thread stalls.
Reported-by: Heiner Litz <hlitz@ucsc.edu>
Signed-off-by: Javier González <javier@cnexlabs.com>
Reviewed-by: Heiner Litz <hlitz@ucsc.edu>
Signed-off-by: Matias Bjørling <mb@lightnvm.io>
Signed-off-by: Jens Axboe <axboe@kernel.dk>
parent 8a57fc38
...@@ -193,8 +193,9 @@ static int pblk_rwb_init(struct pblk *pblk) ...@@ -193,8 +193,9 @@ static int pblk_rwb_init(struct pblk *pblk)
struct nvm_tgt_dev *dev = pblk->dev; struct nvm_tgt_dev *dev = pblk->dev;
struct nvm_geo *geo = &dev->geo; struct nvm_geo *geo = &dev->geo;
unsigned long buffer_size; unsigned long buffer_size;
int pgs_in_buffer; int pgs_in_buffer, threshold;
threshold = geo->mw_cunits * geo->all_luns;
pgs_in_buffer = (max(geo->mw_cunits, geo->ws_opt) + geo->ws_opt) pgs_in_buffer = (max(geo->mw_cunits, geo->ws_opt) + geo->ws_opt)
* geo->all_luns; * geo->all_luns;
...@@ -203,7 +204,7 @@ static int pblk_rwb_init(struct pblk *pblk) ...@@ -203,7 +204,7 @@ static int pblk_rwb_init(struct pblk *pblk)
else else
buffer_size = pgs_in_buffer; buffer_size = pgs_in_buffer;
return pblk_rb_init(&pblk->rwb, buffer_size, geo->csecs); return pblk_rb_init(&pblk->rwb, buffer_size, threshold, geo->csecs);
} }
/* Minimum pages needed within a lun */ /* Minimum pages needed within a lun */
......
...@@ -56,7 +56,8 @@ static unsigned int pblk_rb_calculate_size(unsigned int nr_entries) ...@@ -56,7 +56,8 @@ static unsigned int pblk_rb_calculate_size(unsigned int nr_entries)
* allocated and their size must be a power of two * allocated and their size must be a power of two
* (Documentation/core-api/circular-buffers.rst) * (Documentation/core-api/circular-buffers.rst)
*/ */
int pblk_rb_init(struct pblk_rb *rb, unsigned int size, unsigned int seg_size) int pblk_rb_init(struct pblk_rb *rb, unsigned int size, unsigned int threshold,
unsigned int seg_size)
{ {
struct pblk *pblk = container_of(rb, struct pblk, rwb); struct pblk *pblk = container_of(rb, struct pblk, rwb);
struct pblk_rb_entry *entries; struct pblk_rb_entry *entries;
...@@ -79,6 +80,7 @@ int pblk_rb_init(struct pblk_rb *rb, unsigned int size, unsigned int seg_size) ...@@ -79,6 +80,7 @@ int pblk_rb_init(struct pblk_rb *rb, unsigned int size, unsigned int seg_size)
rb->seg_size = (1 << power_seg_sz); rb->seg_size = (1 << power_seg_sz);
rb->nr_entries = (1 << power_size); rb->nr_entries = (1 << power_size);
rb->mem = rb->subm = rb->sync = rb->l2p_update = 0; rb->mem = rb->subm = rb->sync = rb->l2p_update = 0;
rb->back_thres = threshold;
rb->flush_point = EMPTY_ENTRY; rb->flush_point = EMPTY_ENTRY;
spin_lock_init(&rb->w_lock); spin_lock_init(&rb->w_lock);
...@@ -404,11 +406,14 @@ static int __pblk_rb_may_write(struct pblk_rb *rb, unsigned int nr_entries, ...@@ -404,11 +406,14 @@ static int __pblk_rb_may_write(struct pblk_rb *rb, unsigned int nr_entries,
{ {
unsigned int mem; unsigned int mem;
unsigned int sync; unsigned int sync;
unsigned int threshold;
sync = READ_ONCE(rb->sync); sync = READ_ONCE(rb->sync);
mem = READ_ONCE(rb->mem); mem = READ_ONCE(rb->mem);
if (pblk_rb_ring_space(rb, mem, sync, rb->nr_entries) < nr_entries) threshold = nr_entries + rb->back_thres;
if (pblk_rb_ring_space(rb, mem, sync, rb->nr_entries) < threshold)
return 0; return 0;
if (pblk_rb_update_l2p(rb, nr_entries, mem, sync)) if (pblk_rb_update_l2p(rb, nr_entries, mem, sync))
......
...@@ -203,6 +203,11 @@ struct pblk_rb { ...@@ -203,6 +203,11 @@ struct pblk_rb {
* will be 4KB * will be 4KB
*/ */
unsigned int back_thres; /* Threshold that shall be maintained by
* the backpointer in order to respect
* geo->mw_cunits on a per chunk basis
*/
struct list_head pages; /* List of data pages */ struct list_head pages; /* List of data pages */
spinlock_t w_lock; /* Write lock */ spinlock_t w_lock; /* Write lock */
...@@ -734,7 +739,8 @@ struct pblk_line_ws { ...@@ -734,7 +739,8 @@ struct pblk_line_ws {
/* /*
* pblk ring buffer operations * pblk ring buffer operations
*/ */
int pblk_rb_init(struct pblk_rb *rb, unsigned int size, unsigned int seg_sz); int pblk_rb_init(struct pblk_rb *rb, unsigned int size, unsigned int threshold,
unsigned int seg_sz);
int pblk_rb_may_write_user(struct pblk_rb *rb, struct bio *bio, int pblk_rb_may_write_user(struct pblk_rb *rb, struct bio *bio,
unsigned int nr_entries, unsigned int *pos); unsigned int nr_entries, unsigned int *pos);
int pblk_rb_may_write_gc(struct pblk_rb *rb, unsigned int nr_entries, int pblk_rb_may_write_gc(struct pblk_rb *rb, unsigned int nr_entries,
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment