Safeguard against writing to an active device of another node

Modifying an exiting device's superblock or creating a new superblock
on an existing device needs to be checked because the device could be
in use by another node in another array. So, we check this by taking
all superblock locks in userspace so that we don't  step onto an active
device used by another node and safeguard against accidental edits.
After the edit is complete, we release all locks and the lockspace so
that it can be used by the kernel space.

Signed-off-by: Goldwyn Rodrigues <rgoldwyn@suse.com>
Signed-off-by: Guoqing Jiang <gqjiang@suse.com>
Signed-off-by: NeilBrown <neilb@suse.com>
This commit is contained in:
Guoqing Jiang 2015-10-19 16:03:19 +08:00 committed by NeilBrown
parent 28d744468e
commit d15a1f72bd
5 changed files with 248 additions and 1 deletions

View File

@ -81,11 +81,12 @@ FAILED_SLOTS_DIR = $(RUN_DIR)/failed-slots
SYSTEMD_DIR=/lib/systemd/system
COROSYNC:=$(shell [ -d /usr/include/corosync ] || echo -DNO_COROSYNC)
DLM:=$(shell [ -f /usr/include/libdlm.h ] || echo -DNO_DLM)
DIRFLAGS = -DMAP_DIR=\"$(MAP_DIR)\" -DMAP_FILE=\"$(MAP_FILE)\"
DIRFLAGS += -DMDMON_DIR=\"$(MDMON_DIR)\"
DIRFLAGS += -DFAILED_SLOTS_DIR=\"$(FAILED_SLOTS_DIR)\"
CFLAGS = $(CWFLAGS) $(CXFLAGS) -DSendmail=\""$(MAILCMD)"\" $(CONFFILEFLAGS) $(DIRFLAGS) $(COROSYNC)
CFLAGS = $(CWFLAGS) $(CXFLAGS) -DSendmail=\""$(MAILCMD)"\" $(CONFFILEFLAGS) $(DIRFLAGS) $(COROSYNC) $(DLM)
VERSION = $(shell [ -d .git ] && git describe HEAD | sed 's/mdadm-//')
VERS_DATE = $(shell [ -d .git ] && date --date="`git log -n1 --format=format:%cd --date=short`" '+%0dth %B %Y' | sed -e 's/1th/1st/' -e 's/2th/2nd/' -e 's/11st/11th/' -e 's/12nd/12th/')

View File

@ -1346,6 +1346,8 @@ int main(int argc, char *argv[])
/* --scan implied --brief unless -vv */
c.brief = 1;
set_dlm_hooks(); /* get dlm funcs from libdlm_lt.so.3 */
switch(mode) {
case MANAGE:
/* readonly, add/remove, readwrite, runstop */

45
mdadm.h
View File

@ -35,6 +35,7 @@ extern __off64_t lseek64 __P ((int __fd, __off64_t __offset, int __whence));
#include <sys/types.h>
#include <sys/stat.h>
#include <stdint.h>
#include <stdlib.h>
#include <time.h>
#include <sys/time.h>
@ -51,6 +52,25 @@ extern __off64_t lseek64 __P ((int __fd, __off64_t __offset, int __whence));
#define srandom srand
#endif
#ifndef NO_DLM
#include <libdlm.h>
#include <errno.h>
#else
#define LKF_NOQUEUE 0x00000001
#define LKF_CONVERT 0x00000004
#define LKM_PWMODE 4
#define EUNLOCK 0x10002
typedef void *dlm_lshandle_t;
struct dlm_lksb {
int sb_status;
uint32_t sb_lkid;
char sb_flags;
char *sb_lvbptr;
};
#endif
#include <linux/kdev_t.h>
/*#include <linux/fs.h> */
#include <sys/mount.h>
@ -1423,7 +1443,32 @@ extern char *stat2devnm(struct stat *st);
extern char *fd2devnm(int fd);
extern int in_initrd(void);
struct dlm_hooks {
void *dlm_handle; /* dlm lib related */
dlm_lshandle_t (*create_lockspace)(const char *name,
unsigned int mode);
int (*release_lockspace)(const char *name, dlm_lshandle_t ls,
int force);
int (*ls_lock)(dlm_lshandle_t lockspace, uint32_t mode,
struct dlm_lksb *lksb, uint32_t flags,
const void *name, unsigned int namelen,
uint32_t parent, void (*astaddr) (void *astarg),
void *astarg, void (*bastaddr) (void *astarg),
void *range);
int (*ls_unlock)(dlm_lshandle_t lockspace, uint32_t lkid,
uint32_t flags, struct dlm_lksb *lksb,
void *astarg);
int (*ls_get_fd)(dlm_lshandle_t ls);
int (*dispatch)(int fd);
};
extern int get_cluster_name(char **name);
extern int is_clustered(struct supertype *st);
extern int cluster_get_dlmlock(struct supertype *st, int *lockid);
extern int cluster_release_dlmlock(struct supertype *st, int lockid);
extern void set_dlm_hooks(void);
#define _ROUND_UP(val, base) (((val) + (base) - 1) & ~(base - 1))
#define ROUND_UP(val, base) _ROUND_UP(val, (typeof(val))(base))

View File

@ -1110,8 +1110,18 @@ static int update_super1(struct supertype *st, struct mdinfo *info,
* ignored.
*/
int rv = 0;
int lockid;
struct mdp_superblock_1 *sb = st->sb;
if (is_clustered(st)) {
rv = cluster_get_dlmlock(st, &lockid);
if (rv) {
pr_err("Cannot get dlmlock in %s return %d\n", __func__, rv);
cluster_release_dlmlock(st, lockid);
return rv;
}
}
if (strcmp(update, "homehost") == 0 &&
homehost) {
/* Note that 'homehost' is special as it is really
@ -1370,6 +1380,9 @@ static int update_super1(struct supertype *st, struct mdinfo *info,
rv = -1;
sb->sb_csum = calc_sb_1_csum(sb);
if (is_clustered(st))
cluster_release_dlmlock(st, lockid);
return rv;
}
@ -1473,6 +1486,16 @@ static int add_to_super1(struct supertype *st, mdu_disk_info_t *dk,
struct mdp_superblock_1 *sb = st->sb;
__u16 *rp = sb->dev_roles + dk->number;
struct devinfo *di, **dip;
int rv, lockid;
if (is_clustered(st)) {
rv = cluster_get_dlmlock(st, &lockid);
if (rv) {
pr_err("Cannot get dlmlock in %s return %d\n", __func__, rv);
cluster_release_dlmlock(st, lockid);
return rv;
}
}
if ((dk->state & 6) == 6) /* active, sync */
*rp = __cpu_to_le16(dk->raid_disk);
@ -1502,6 +1525,9 @@ static int add_to_super1(struct supertype *st, mdu_disk_info_t *dk,
di->next = NULL;
*dip = di;
if (is_clustered(st))
cluster_release_dlmlock(st, lockid);
return 0;
}
#endif
@ -1515,6 +1541,16 @@ static int store_super1(struct supertype *st, int fd)
struct align_fd afd;
int sbsize;
unsigned long long dsize;
int rv, lockid;
if (is_clustered(st)) {
rv = cluster_get_dlmlock(st, &lockid);
if (rv) {
pr_err("Cannot get dlmlock in %s return %d\n", __func__, rv);
cluster_release_dlmlock(st, lockid);
return rv;
}
}
if (!get_dev_size(fd, NULL, &dsize))
return 1;
@ -1575,6 +1611,9 @@ static int store_super1(struct supertype *st, int fd)
}
}
fsync(fd);
if (is_clustered(st))
cluster_release_dlmlock(st, lockid);
return 0;
}
@ -2391,6 +2430,16 @@ static int write_bitmap1(struct supertype *st, int fd, enum bitmap_update update
static void free_super1(struct supertype *st)
{
int rv, lockid;
if (is_clustered(st)) {
rv = cluster_get_dlmlock(st, &lockid);
if (rv) {
pr_err("Cannot get dlmlock in %s return %d\n", __func__, rv);
cluster_release_dlmlock(st, lockid);
return;
}
}
if (st->sb)
free(st->sb);
while (st->info) {
@ -2401,6 +2450,8 @@ static void free_super1(struct supertype *st)
free(di);
}
st->sb = NULL;
if (is_clustered(st))
cluster_release_dlmlock(st, lockid);
}
#ifndef MDASSEMBLE

148
util.c
View File

@ -24,6 +24,7 @@
#include "mdadm.h"
#include "md_p.h"
#include <sys/poll.h>
#include <sys/socket.h>
#include <sys/utsname.h>
#include <sys/wait.h>
@ -88,6 +89,131 @@ struct blkpg_partition {
aren't permitted). */
#define BUILD_BUG_ON_ZERO(e) (sizeof(struct { int:-!!(e); }))
static struct dlm_hooks *dlm_hooks = NULL;
static int is_dlm_hooks_ready = 0;
struct dlm_lock_resource *dlm_lock_res = NULL;
static int ast_called = 0;
struct dlm_lock_resource {
dlm_lshandle_t *ls;
struct dlm_lksb lksb;
};
int is_clustered(struct supertype *st)
{
/* is it a cluster md or not */
if (is_dlm_hooks_ready && st->cluster_name)
return 1;
else
return 0;
}
/* Using poll(2) to wait for and dispatch ASTs */
static int poll_for_ast(dlm_lshandle_t ls)
{
struct pollfd pfd;
pfd.fd = dlm_hooks->ls_get_fd(ls);
pfd.events = POLLIN;
while (!ast_called)
{
if (poll(&pfd, 1, 0) < 0)
{
perror("poll");
return -1;
}
dlm_hooks->dispatch(dlm_hooks->ls_get_fd(ls));
}
ast_called = 0;
return 0;
}
static void dlm_ast(void *arg)
{
ast_called = 1;
}
/* Create the lockspace, take bitmapXXX locks on all the bitmaps. */
int cluster_get_dlmlock(struct supertype *st, int *lockid)
{
int ret = -1;
char str[64];
int flags = LKF_NOQUEUE;
dlm_lock_res = xmalloc(sizeof(struct dlm_lock_resource));
dlm_lock_res->ls = dlm_hooks->create_lockspace(st->cluster_name, O_RDWR);
if (!dlm_lock_res->ls) {
pr_err("%s failed to create lockspace\n", st->cluster_name);
goto out;
}
/* Conversions need the lockid in the LKSB */
if (flags & LKF_CONVERT)
dlm_lock_res->lksb.sb_lkid = *lockid;
snprintf(str, 64, "bitmap%04d", st->nodes);
/* if flags with LKF_CONVERT causes below return ENOENT which means
* "No such file or directory" */
ret = dlm_hooks->ls_lock(dlm_lock_res->ls, LKM_PWMODE, &dlm_lock_res->lksb,
flags, str, strlen(str), 0, dlm_ast,
dlm_lock_res, NULL, NULL);
if (ret) {
pr_err("error %d when get PW mode on lock %s\n", errno, str);
goto out;
}
/* Wait for it to complete */
poll_for_ast(dlm_lock_res->ls);
*lockid = dlm_lock_res->lksb.sb_lkid;
errno = dlm_lock_res->lksb.sb_status;
if (errno) {
pr_err("error %d happened in ast with lock %s\n", errno, str);
goto out;
}
out:
return ret;
}
int cluster_release_dlmlock(struct supertype *st, int lockid)
{
int ret = -1;
/* if flags with LKF_CONVERT causes below return EINVAL which means
* "Invalid argument" */
ret = dlm_hooks->ls_unlock(dlm_lock_res->ls, lockid, 0,
&dlm_lock_res->lksb, dlm_lock_res);
if (ret) {
pr_err("error %d happened when unlock\n", errno);
/* XXX make sure the lock is unlocked eventually */
goto out;
}
/* Wait for it to complete */
poll_for_ast(dlm_lock_res->ls);
errno = dlm_lock_res->lksb.sb_status;
if (errno != EUNLOCK) {
pr_err("error %d happened in ast when unlock lockspace\n", errno);
/* XXX make sure the lockspace is unlocked eventually */
goto out;
}
ret = dlm_hooks->release_lockspace(st->cluster_name, dlm_lock_res->ls, 1);
if (ret) {
pr_err("error %d happened when release lockspace\n", errno);
/* XXX make sure the lockspace is released eventually */
goto out;
}
free(dlm_lock_res);
out:
return ret;
}
/*
* Parse a 128 bit uuid in 4 integers
* format is 32 hexx nibbles with options :.<space> separator
@ -2043,4 +2169,26 @@ out:
dlclose(lib_handle);
return rv;
}
void set_dlm_hooks(void)
{
dlm_hooks = xmalloc(sizeof(struct dlm_hooks));
dlm_hooks->dlm_handle = dlopen("libdlm_lt.so.3", RTLD_NOW | RTLD_LOCAL);
if (!dlm_hooks->dlm_handle)
return;
dlm_hooks->create_lockspace = dlsym(dlm_hooks->dlm_handle, "dlm_create_lockspace");
dlm_hooks->release_lockspace = dlsym(dlm_hooks->dlm_handle, "dlm_release_lockspace");
dlm_hooks->ls_lock = dlsym(dlm_hooks->dlm_handle, "dlm_ls_lock");
dlm_hooks->ls_unlock = dlsym(dlm_hooks->dlm_handle, "dlm_ls_unlock");
dlm_hooks->ls_get_fd = dlsym(dlm_hooks->dlm_handle, "dlm_ls_get_fd");
dlm_hooks->dispatch = dlsym(dlm_hooks->dlm_handle, "dlm_dispatch");
if (!dlm_hooks->create_lockspace || !dlm_hooks->ls_lock ||
!dlm_hooks->ls_unlock || !dlm_hooks->release_lockspace ||
!dlm_hooks->ls_get_fd || !dlm_hooks->dispatch)
dlclose(dlm_hooks->dlm_handle);
else
is_dlm_hooks_ready = 1;
}
#endif