Commit e8823bd6 authored by Artem Bityutskiy's avatar Artem Bityutskiy

UBI: fix atomic LEB change problems

When the UBI device is nearly full, i.e. all LEBs are mapped, we have
only one spare LEB left - the one we reserved for WL purposes. Well,
I do not count the LEBs which were reserved for bad PEB handling -
suppose NOR flash for simplicity. If an "atomic LEB change operation"
is run, and the WL unit is moving a LEB, we have no spare LEBs to
finish the operation and fail, which is not good. Moreover, if there
are 2 or more simultanious "atomic LEB change" requests, only one of
them has chances to succeed, the other will fail with -ENOSPC. Not
good either.

This patch does 2 things:
1. Reserves one PEB for the "atomic LEB change" operation.
2. Serealize the operations so that only on of them may run
   at a time (by means of a mutex).
Pointed-to-by: default avatarBrijesh Singh <brijesh.s.singh@gmail.com>
Signed-off-by: default avatarArtem Bityutskiy <Artem.Bityutskiy@nokia.com>
parent 6986646b
...@@ -46,6 +46,9 @@ ...@@ -46,6 +46,9 @@
#include <linux/err.h> #include <linux/err.h>
#include "ubi.h" #include "ubi.h"
/* Number of physical eraseblocks reserved for atomic LEB change operation */
#define EBA_RESERVED_PEBS 1
/** /**
* struct ltree_entry - an entry in the lock tree. * struct ltree_entry - an entry in the lock tree.
* @rb: links RB-tree nodes * @rb: links RB-tree nodes
...@@ -827,6 +830,9 @@ write_error: ...@@ -827,6 +830,9 @@ write_error:
* data, which has to be aligned. This function guarantees that in case of an * data, which has to be aligned. This function guarantees that in case of an
* unclean reboot the old contents is preserved. Returns zero in case of * unclean reboot the old contents is preserved. Returns zero in case of
* success and a negative error code in case of failure. * success and a negative error code in case of failure.
*
* UBI reserves one LEB for the "atomic LEB change" operation, so only one
* LEB change may be done at a time. This is ensured by @ubi->alc_mutex.
*/ */
int ubi_eba_atomic_leb_change(struct ubi_device *ubi, int vol_id, int lnum, int ubi_eba_atomic_leb_change(struct ubi_device *ubi, int vol_id, int lnum,
const void *buf, int len, int dtype) const void *buf, int len, int dtype)
...@@ -843,11 +849,10 @@ int ubi_eba_atomic_leb_change(struct ubi_device *ubi, int vol_id, int lnum, ...@@ -843,11 +849,10 @@ int ubi_eba_atomic_leb_change(struct ubi_device *ubi, int vol_id, int lnum,
if (!vid_hdr) if (!vid_hdr)
return -ENOMEM; return -ENOMEM;
mutex_lock(&ubi->alc_mutex);
err = leb_write_lock(ubi, vol_id, lnum); err = leb_write_lock(ubi, vol_id, lnum);
if (err) { if (err)
ubi_free_vid_hdr(ubi, vid_hdr); goto out_mutex;
return err;
}
vid_hdr->sqnum = cpu_to_be64(next_sqnum(ubi)); vid_hdr->sqnum = cpu_to_be64(next_sqnum(ubi));
vid_hdr->vol_id = cpu_to_be32(vol_id); vid_hdr->vol_id = cpu_to_be32(vol_id);
...@@ -864,9 +869,8 @@ int ubi_eba_atomic_leb_change(struct ubi_device *ubi, int vol_id, int lnum, ...@@ -864,9 +869,8 @@ int ubi_eba_atomic_leb_change(struct ubi_device *ubi, int vol_id, int lnum,
retry: retry:
pnum = ubi_wl_get_peb(ubi, dtype); pnum = ubi_wl_get_peb(ubi, dtype);
if (pnum < 0) { if (pnum < 0) {
ubi_free_vid_hdr(ubi, vid_hdr); err = pnum;
leb_write_unlock(ubi, vol_id, lnum); goto out_leb_unlock;
return pnum;
} }
dbg_eba("change LEB %d:%d, PEB %d, write VID hdr to PEB %d", dbg_eba("change LEB %d:%d, PEB %d, write VID hdr to PEB %d",
...@@ -888,17 +892,18 @@ retry: ...@@ -888,17 +892,18 @@ retry:
if (vol->eba_tbl[lnum] >= 0) { if (vol->eba_tbl[lnum] >= 0) {
err = ubi_wl_put_peb(ubi, vol->eba_tbl[lnum], 1); err = ubi_wl_put_peb(ubi, vol->eba_tbl[lnum], 1);
if (err) { if (err)
ubi_free_vid_hdr(ubi, vid_hdr); goto out_leb_unlock;
leb_write_unlock(ubi, vol_id, lnum);
return err;
}
} }
vol->eba_tbl[lnum] = pnum; vol->eba_tbl[lnum] = pnum;
out_leb_unlock:
leb_write_unlock(ubi, vol_id, lnum); leb_write_unlock(ubi, vol_id, lnum);
out_mutex:
mutex_unlock(&ubi->alc_mutex);
ubi_free_vid_hdr(ubi, vid_hdr); ubi_free_vid_hdr(ubi, vid_hdr);
return 0; return err;
write_error: write_error:
if (err != -EIO || !ubi->bad_allowed) { if (err != -EIO || !ubi->bad_allowed) {
...@@ -908,17 +913,13 @@ write_error: ...@@ -908,17 +913,13 @@ write_error:
* mode just in case. * mode just in case.
*/ */
ubi_ro_mode(ubi); ubi_ro_mode(ubi);
leb_write_unlock(ubi, vol_id, lnum); goto out_leb_unlock;
ubi_free_vid_hdr(ubi, vid_hdr);
return err;
} }
err = ubi_wl_put_peb(ubi, pnum, 1); err = ubi_wl_put_peb(ubi, pnum, 1);
if (err || ++tries > UBI_IO_RETRIES) { if (err || ++tries > UBI_IO_RETRIES) {
ubi_ro_mode(ubi); ubi_ro_mode(ubi);
leb_write_unlock(ubi, vol_id, lnum); goto out_leb_unlock;
ubi_free_vid_hdr(ubi, vid_hdr);
return err;
} }
vid_hdr->sqnum = cpu_to_be64(next_sqnum(ubi)); vid_hdr->sqnum = cpu_to_be64(next_sqnum(ubi));
...@@ -1122,6 +1123,7 @@ int ubi_eba_init_scan(struct ubi_device *ubi, struct ubi_scan_info *si) ...@@ -1122,6 +1123,7 @@ int ubi_eba_init_scan(struct ubi_device *ubi, struct ubi_scan_info *si)
dbg_eba("initialize EBA unit"); dbg_eba("initialize EBA unit");
spin_lock_init(&ubi->ltree_lock); spin_lock_init(&ubi->ltree_lock);
mutex_init(&ubi->alc_mutex);
ubi->ltree = RB_ROOT; ubi->ltree = RB_ROOT;
if (ubi_devices_cnt == 0) { if (ubi_devices_cnt == 0) {
...@@ -1183,6 +1185,14 @@ int ubi_eba_init_scan(struct ubi_device *ubi, struct ubi_scan_info *si) ...@@ -1183,6 +1185,14 @@ int ubi_eba_init_scan(struct ubi_device *ubi, struct ubi_scan_info *si)
ubi->rsvd_pebs += ubi->beb_rsvd_pebs; ubi->rsvd_pebs += ubi->beb_rsvd_pebs;
} }
if (ubi->avail_pebs < EBA_RESERVED_PEBS) {
ubi_err("no enough physical eraseblocks (%d, need %d)",
ubi->avail_pebs, EBA_RESERVED_PEBS);
goto out_free;
}
ubi->avail_pebs -= EBA_RESERVED_PEBS;
ubi->rsvd_pebs += EBA_RESERVED_PEBS;
dbg_eba("EBA unit is initialized"); dbg_eba("EBA unit is initialized");
return 0; return 0;
......
...@@ -221,14 +221,15 @@ struct ubi_wl_entry; ...@@ -221,14 +221,15 @@ struct ubi_wl_entry;
* @vtbl_slots: how many slots are available in the volume table * @vtbl_slots: how many slots are available in the volume table
* @vtbl_size: size of the volume table in bytes * @vtbl_size: size of the volume table in bytes
* @vtbl: in-RAM volume table copy * @vtbl: in-RAM volume table copy
* @vtbl_mutex: protects on-flash volume table
* *
* @max_ec: current highest erase counter value * @max_ec: current highest erase counter value
* @mean_ec: current mean erase counter value * @mean_ec: current mean erase counter value
* *
* global_sqnum: global sequence number * @global_sqnum: global sequence number
* @ltree_lock: protects the lock tree and @global_sqnum * @ltree_lock: protects the lock tree and @global_sqnum
* @ltree: the lock tree * @ltree: the lock tree
* @vtbl_mutex: protects on-flash volume table * @alc_mutex: serializes "atomic LEB change" operations
* *
* @used: RB-tree of used physical eraseblocks * @used: RB-tree of used physical eraseblocks
* @free: RB-tree of free physical eraseblocks * @free: RB-tree of free physical eraseblocks
...@@ -308,6 +309,7 @@ struct ubi_device { ...@@ -308,6 +309,7 @@ struct ubi_device {
unsigned long long global_sqnum; unsigned long long global_sqnum;
spinlock_t ltree_lock; spinlock_t ltree_lock;
struct rb_root ltree; struct rb_root ltree;
struct mutex alc_mutex;
/* Wear-leveling unit's stuff */ /* Wear-leveling unit's stuff */
struct rb_root used; struct rb_root used;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment