diff options
author | Junxiao Bi <junxiao.bi@oracle.com> | 2016-05-27 17:27:10 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2016-05-27 17:49:37 -0400 |
commit | 88dbe98dc72fa0c2b778210e2079cd69d2477b36 (patch) | |
tree | ce2ce48ac1b3592e9ba841c49101b72224b2ce94 /fs | |
parent | 1bd1290283d7939478062e80bdd9719d3a21522f (diff) |
ocfs2: o2hb: don't negotiate if last hb fail
Sometimes an I/O error is returned when storage is down for a while. For
example, with an iSCSI device, storage is taken offline when the session
times out, and this makes all I/O return -EIO. In this case, nodes shouldn't
negotiate the timeout but should fence themselves. So let nodes fence
themselves when o2hb_do_disk_heartbeat returns an error; this is the same
behavior as o2hb without the negotiate timer.
Signed-off-by: Junxiao Bi <junxiao.bi@oracle.com>
Reviewed-by: Ryan Ding <ryan.ding@oracle.com>
Reviewed-by: Mark Fasheh <mfasheh@suse.de>
Cc: Gang He <ghe@suse.com>
Cc: rwxybh <rwxybh@126.com>
Cc: Joel Becker <jlbec@evilplan.org>
Cc: Joseph Qi <joseph.qi@huawei.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'fs')
-rw-r--r-- | fs/ocfs2/cluster/heartbeat.c | 10 |
1 files changed, 10 insertions, 0 deletions
diff --git a/fs/ocfs2/cluster/heartbeat.c b/fs/ocfs2/cluster/heartbeat.c index 84ebeb5678c6..31a5c0803e0a 100644 --- a/fs/ocfs2/cluster/heartbeat.c +++ b/fs/ocfs2/cluster/heartbeat.c | |||
@@ -284,6 +284,9 @@ struct o2hb_region { | |||
284 | /* Message key for negotiate timeout message. */ | 284 | /* Message key for negotiate timeout message. */ |
285 | unsigned int hr_key; | 285 | unsigned int hr_key; |
286 | struct list_head hr_handler_list; | 286 | struct list_head hr_handler_list; |
287 | |||
288 | /* last hb status, 0 for success, other value for error. */ | ||
289 | int hr_last_hb_status; | ||
287 | }; | 290 | }; |
288 | 291 | ||
289 | struct o2hb_bio_wait_ctxt { | 292 | struct o2hb_bio_wait_ctxt { |
@@ -395,6 +398,12 @@ static void o2hb_nego_timeout(struct work_struct *work) | |||
395 | struct o2hb_region *reg; | 398 | struct o2hb_region *reg; |
396 | 399 | ||
397 | reg = container_of(work, struct o2hb_region, hr_nego_timeout_work.work); | 400 | reg = container_of(work, struct o2hb_region, hr_nego_timeout_work.work); |
401 | /* don't negotiate timeout if last hb failed since it is very | ||
402 | * possible io failed. Should let write timeout fence self. | ||
403 | */ | ||
404 | if (reg->hr_last_hb_status) | ||
405 | return; | ||
406 | |||
398 | o2hb_fill_node_map(live_node_bitmap, sizeof(live_node_bitmap)); | 407 | o2hb_fill_node_map(live_node_bitmap, sizeof(live_node_bitmap)); |
399 | /* lowest node as master node to make negotiate decision. */ | 408 | /* lowest node as master node to make negotiate decision. */ |
400 | master_node = find_next_bit(live_node_bitmap, O2NM_MAX_NODES, 0); | 409 | master_node = find_next_bit(live_node_bitmap, O2NM_MAX_NODES, 0); |
@@ -1228,6 +1237,7 @@ static int o2hb_thread(void *data) | |||
1228 | before_hb = ktime_get_real(); | 1237 | before_hb = ktime_get_real(); |
1229 | 1238 | ||
1230 | ret = o2hb_do_disk_heartbeat(reg); | 1239 | ret = o2hb_do_disk_heartbeat(reg); |
1240 | reg->hr_last_hb_status = ret; | ||
1231 | 1241 | ||
1232 | after_hb = ktime_get_real(); | 1242 | after_hb = ktime_get_real(); |
1233 | 1243 | ||