Commit c63e31c2 authored by David Teigland, committed by Steven Whitehouse

[GFS2] journal recovery patch

This is one of the changes related to journal recovery I mentioned a
couple weeks ago.  We can get into a situation where there are only
readonly nodes currently mounting the fs, but there are journals that need
to be recovered.  Since the readonly nodes can't recover journals, the
next rw mounter needs to go through and check all journals and recover any
that are dirty (i.e. what the first node to mount the fs does).  This rw
mounter needs to skip the journals held by the existing readonly nodes.
Skipping those journals amounts to using the TRY flag on the journal locks
so acquiring the lock of a journal held by a readonly node will fail
instead of blocking indefinitely.
Signed-off-by: David Teigland <teigland@redhat.com>
Signed-off-by: Steven Whitehouse <swhiteho@redhat.com>
parent 190562bd
...@@ -444,8 +444,7 @@ static int init_journal(struct gfs2_sbd *sdp, int undo) ...@@ -444,8 +444,7 @@ static int init_journal(struct gfs2_sbd *sdp, int undo)
if (sdp->sd_lockstruct.ls_first) { if (sdp->sd_lockstruct.ls_first) {
unsigned int x; unsigned int x;
for (x = 0; x < sdp->sd_journals; x++) { for (x = 0; x < sdp->sd_journals; x++) {
error = gfs2_recover_journal(gfs2_jdesc_find(sdp, x), error = gfs2_recover_journal(gfs2_jdesc_find(sdp, x));
WAIT);
if (error) { if (error) {
fs_err(sdp, "error recovering journal %u: %d\n", fs_err(sdp, "error recovering journal %u: %d\n",
x, error); x, error);
...@@ -455,7 +454,7 @@ static int init_journal(struct gfs2_sbd *sdp, int undo) ...@@ -455,7 +454,7 @@ static int init_journal(struct gfs2_sbd *sdp, int undo)
gfs2_lm_others_may_mount(sdp); gfs2_lm_others_may_mount(sdp);
} else if (!sdp->sd_args.ar_spectator) { } else if (!sdp->sd_args.ar_spectator) {
error = gfs2_recover_journal(sdp->sd_jdesc, WAIT); error = gfs2_recover_journal(sdp->sd_jdesc);
if (error) { if (error) {
fs_err(sdp, "error recovering my journal: %d\n", error); fs_err(sdp, "error recovering my journal: %d\n", error);
goto fail_jinode_gh; goto fail_jinode_gh;
......
...@@ -418,7 +418,6 @@ static int clean_journal(struct gfs2_jdesc *jd, struct gfs2_log_header *head) ...@@ -418,7 +418,6 @@ static int clean_journal(struct gfs2_jdesc *jd, struct gfs2_log_header *head)
/** /**
* gfs2_recover_journal - recovery a given journal * gfs2_recover_journal - recovery a given journal
* @jd: the struct gfs2_jdesc describing the journal * @jd: the struct gfs2_jdesc describing the journal
* @wait: Don't return until the journal is clean (or an error is encountered)
* *
* Acquire the journal's lock, check to see if the journal is clean, and * Acquire the journal's lock, check to see if the journal is clean, and
* do recovery if necessary. * do recovery if necessary.
...@@ -426,7 +425,7 @@ static int clean_journal(struct gfs2_jdesc *jd, struct gfs2_log_header *head) ...@@ -426,7 +425,7 @@ static int clean_journal(struct gfs2_jdesc *jd, struct gfs2_log_header *head)
* Returns: errno * Returns: errno
*/ */
int gfs2_recover_journal(struct gfs2_jdesc *jd, int wait) int gfs2_recover_journal(struct gfs2_jdesc *jd)
{ {
struct gfs2_inode *ip = jd->jd_inode->u.generic_ip; struct gfs2_inode *ip = jd->jd_inode->u.generic_ip;
struct gfs2_sbd *sdp = ip->i_sbd; struct gfs2_sbd *sdp = ip->i_sbd;
...@@ -441,12 +440,10 @@ int gfs2_recover_journal(struct gfs2_jdesc *jd, int wait) ...@@ -441,12 +440,10 @@ int gfs2_recover_journal(struct gfs2_jdesc *jd, int wait)
/* Aquire the journal lock so we can do recovery */ /* Aquire the journal lock so we can do recovery */
error = gfs2_glock_nq_num(sdp, error = gfs2_glock_nq_num(sdp, jd->jd_jid, &gfs2_journal_glops,
jd->jd_jid, &gfs2_journal_glops,
LM_ST_EXCLUSIVE, LM_ST_EXCLUSIVE,
LM_FLAG_NOEXP | LM_FLAG_NOEXP | LM_FLAG_TRY | GL_NOCACHE,
((wait) ? 0 : LM_FLAG_TRY) | &j_gh);
GL_NOCACHE, &j_gh);
switch (error) { switch (error) {
case 0: case 0:
break; break;
...@@ -574,7 +571,7 @@ void gfs2_check_journals(struct gfs2_sbd *sdp) ...@@ -574,7 +571,7 @@ void gfs2_check_journals(struct gfs2_sbd *sdp)
break; break;
if (jd != sdp->sd_jdesc) if (jd != sdp->sd_jdesc)
gfs2_recover_journal(jd, NO_WAIT); gfs2_recover_journal(jd);
} }
} }
...@@ -25,7 +25,7 @@ void gfs2_revoke_clean(struct gfs2_sbd *sdp); ...@@ -25,7 +25,7 @@ void gfs2_revoke_clean(struct gfs2_sbd *sdp);
int gfs2_find_jhead(struct gfs2_jdesc *jd, int gfs2_find_jhead(struct gfs2_jdesc *jd,
struct gfs2_log_header *head); struct gfs2_log_header *head);
int gfs2_recover_journal(struct gfs2_jdesc *gfs2_jd, int wait); int gfs2_recover_journal(struct gfs2_jdesc *gfs2_jd);
void gfs2_check_journals(struct gfs2_sbd *sdp); void gfs2_check_journals(struct gfs2_sbd *sdp);
#endif /* __RECOVERY_DOT_H__ */ #endif /* __RECOVERY_DOT_H__ */
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment