dm log: userspace add luid to distinguish between concurrent log instances

Device-mapper userspace logs (like the clustered log) are
identified by a universally unique identifier (UUID).  This
identifier is used to associate requests from the kernel to
a specific log in userspace.  The UUID must be unique everywhere,
since multiple machines may use this identifier when communicating
about a particular log, as is the case for cluster logs.

Sometimes, device-mapper/LVM may re-use a UUID.  This is the
case during pvmoves, when moving from one segment of an LV
to another, or when resizing a mirror, etc.  In these cases,
a new log is created with the same UUID and loaded in the
"inactive" slot.  When a device-mapper "resume" is issued,
the "live" table is deactivated and the new "inactive" table
becomes "live".  (The "inactive" table can also be removed
via a device-mapper 'clear' command.)

The above two issues were colliding.  More than one log was being
created with the same UUID, and there was no way to distinguish
between them.  So, sometimes the wrong log would be swapped
out during the exchange.

The solution is to create a locally unique identifier,
'luid', to go along with the UUID.  This new identifier is used
to determine exactly which log is being referenced by the kernel
when the log exchange is made.  The identifier is not
universally safe, but it does not need to be, since
create/destroy/suspend/resume operations are bound to a specific
machine; and these are the operations that make up the exchange.

Signed-off-by: Jonathan Brassow <jbrassow@redhat.com>
Signed-off-by: Alasdair G Kergon <agk@redhat.com>
This commit is contained in:
Jonathan Brassow 2009-09-04 20:40:34 +01:00 committed by Alasdair G Kergon
parent d2b698644c
commit 7ec23d5094
4 changed files with 31 additions and 13 deletions

View file

@ -21,6 +21,7 @@ struct log_c {
struct dm_target *ti; struct dm_target *ti;
uint32_t region_size; uint32_t region_size;
region_t region_count; region_t region_count;
uint64_t luid;
char uuid[DM_UUID_LEN]; char uuid[DM_UUID_LEN];
char *usr_argv_str; char *usr_argv_str;
@ -63,7 +64,7 @@ static int userspace_do_request(struct log_c *lc, const char *uuid,
* restored. * restored.
*/ */
retry: retry:
r = dm_consult_userspace(uuid, request_type, data, r = dm_consult_userspace(uuid, lc->luid, request_type, data,
data_size, rdata, rdata_size); data_size, rdata, rdata_size);
if (r != -ESRCH) if (r != -ESRCH)
@ -74,14 +75,15 @@ retry:
set_current_state(TASK_INTERRUPTIBLE); set_current_state(TASK_INTERRUPTIBLE);
schedule_timeout(2*HZ); schedule_timeout(2*HZ);
DMWARN("Attempting to contact userspace log server..."); DMWARN("Attempting to contact userspace log server...");
r = dm_consult_userspace(uuid, DM_ULOG_CTR, lc->usr_argv_str, r = dm_consult_userspace(uuid, lc->luid, DM_ULOG_CTR,
lc->usr_argv_str,
strlen(lc->usr_argv_str) + 1, strlen(lc->usr_argv_str) + 1,
NULL, NULL); NULL, NULL);
if (!r) if (!r)
break; break;
} }
DMINFO("Reconnected to userspace log server... DM_ULOG_CTR complete"); DMINFO("Reconnected to userspace log server... DM_ULOG_CTR complete");
r = dm_consult_userspace(uuid, DM_ULOG_RESUME, NULL, r = dm_consult_userspace(uuid, lc->luid, DM_ULOG_RESUME, NULL,
0, NULL, NULL); 0, NULL, NULL);
if (!r) if (!r)
goto retry; goto retry;
@ -153,6 +155,9 @@ static int userspace_ctr(struct dm_dirty_log *log, struct dm_target *ti,
return -ENOMEM; return -ENOMEM;
} }
/* The ptr value is sufficient for local unique id */
lc->luid = (uint64_t)lc;
lc->ti = ti; lc->ti = ti;
if (strlen(argv[0]) > (DM_UUID_LEN - 1)) { if (strlen(argv[0]) > (DM_UUID_LEN - 1)) {
@ -172,7 +177,7 @@ static int userspace_ctr(struct dm_dirty_log *log, struct dm_target *ti,
} }
/* Send table string */ /* Send table string */
r = dm_consult_userspace(lc->uuid, DM_ULOG_CTR, r = dm_consult_userspace(lc->uuid, lc->luid, DM_ULOG_CTR,
ctr_str, str_size, NULL, NULL); ctr_str, str_size, NULL, NULL);
if (r == -ESRCH) { if (r == -ESRCH) {
@ -182,7 +187,7 @@ static int userspace_ctr(struct dm_dirty_log *log, struct dm_target *ti,
/* Since the region size does not change, get it now */ /* Since the region size does not change, get it now */
rdata_size = sizeof(rdata); rdata_size = sizeof(rdata);
r = dm_consult_userspace(lc->uuid, DM_ULOG_GET_REGION_SIZE, r = dm_consult_userspace(lc->uuid, lc->luid, DM_ULOG_GET_REGION_SIZE,
NULL, 0, (char *)&rdata, &rdata_size); NULL, 0, (char *)&rdata, &rdata_size);
if (r) { if (r) {
@ -211,7 +216,7 @@ static void userspace_dtr(struct dm_dirty_log *log)
int r; int r;
struct log_c *lc = log->context; struct log_c *lc = log->context;
r = dm_consult_userspace(lc->uuid, DM_ULOG_DTR, r = dm_consult_userspace(lc->uuid, lc->luid, DM_ULOG_DTR,
NULL, 0, NULL, 0,
NULL, NULL); NULL, NULL);
@ -226,7 +231,7 @@ static int userspace_presuspend(struct dm_dirty_log *log)
int r; int r;
struct log_c *lc = log->context; struct log_c *lc = log->context;
r = dm_consult_userspace(lc->uuid, DM_ULOG_PRESUSPEND, r = dm_consult_userspace(lc->uuid, lc->luid, DM_ULOG_PRESUSPEND,
NULL, 0, NULL, 0,
NULL, NULL); NULL, NULL);
@ -238,7 +243,7 @@ static int userspace_postsuspend(struct dm_dirty_log *log)
int r; int r;
struct log_c *lc = log->context; struct log_c *lc = log->context;
r = dm_consult_userspace(lc->uuid, DM_ULOG_POSTSUSPEND, r = dm_consult_userspace(lc->uuid, lc->luid, DM_ULOG_POSTSUSPEND,
NULL, 0, NULL, 0,
NULL, NULL); NULL, NULL);
@ -251,7 +256,7 @@ static int userspace_resume(struct dm_dirty_log *log)
struct log_c *lc = log->context; struct log_c *lc = log->context;
lc->in_sync_hint = 0; lc->in_sync_hint = 0;
r = dm_consult_userspace(lc->uuid, DM_ULOG_RESUME, r = dm_consult_userspace(lc->uuid, lc->luid, DM_ULOG_RESUME,
NULL, 0, NULL, 0,
NULL, NULL); NULL, NULL);

View file

@ -147,7 +147,8 @@ static void cn_ulog_callback(void *data)
/** /**
* dm_consult_userspace * dm_consult_userspace
* @uuid: log's uuid (must be DM_UUID_LEN in size) * @uuid: log's universal unique identifier (must be DM_UUID_LEN in size)
* @luid: log's local unique identifier
* @request_type: found in include/linux/dm-log-userspace.h * @request_type: found in include/linux/dm-log-userspace.h
* @data: data to tx to the server * @data: data to tx to the server
* @data_size: size of data in bytes * @data_size: size of data in bytes
@ -163,7 +164,7 @@ static void cn_ulog_callback(void *data)
* *
* Returns: 0 on success, -EXXX on failure * Returns: 0 on success, -EXXX on failure
**/ **/
int dm_consult_userspace(const char *uuid, int request_type, int dm_consult_userspace(const char *uuid, uint64_t luid, int request_type,
char *data, size_t data_size, char *data, size_t data_size,
char *rdata, size_t *rdata_size) char *rdata, size_t *rdata_size)
{ {
@ -190,6 +191,7 @@ resend:
memset(tfr, 0, DM_ULOG_PREALLOCED_SIZE - overhead_size); memset(tfr, 0, DM_ULOG_PREALLOCED_SIZE - overhead_size);
memcpy(tfr->uuid, uuid, DM_UUID_LEN); memcpy(tfr->uuid, uuid, DM_UUID_LEN);
tfr->luid = luid;
tfr->seq = dm_ulog_seq++; tfr->seq = dm_ulog_seq++;
/* /*

View file

@ -11,7 +11,7 @@
int dm_ulog_tfr_init(void); int dm_ulog_tfr_init(void);
void dm_ulog_tfr_exit(void); void dm_ulog_tfr_exit(void);
int dm_consult_userspace(const char *uuid, int request_type, int dm_consult_userspace(const char *uuid, uint64_t luid, int request_type,
char *data, size_t data_size, char *data, size_t data_size,
char *rdata, size_t *rdata_size); char *rdata, size_t *rdata_size);

View file

@ -371,7 +371,18 @@
(DM_ULOG_REQUEST_MASK & (request_type)) (DM_ULOG_REQUEST_MASK & (request_type))
struct dm_ulog_request { struct dm_ulog_request {
char uuid[DM_UUID_LEN]; /* Ties a request to a specific mirror log */ /*
* The local unique identifier (luid) and the universally unique
* identifier (uuid) are used to tie a request to a specific
* mirror log. A single machine log could probably make due with
* just the 'luid', but a cluster-aware log must use the 'uuid' and
* the 'luid'. The uuid is what is required for node to node
* communication concerning a particular log, but the 'luid' helps
* differentiate between logs that are being swapped and have the
* same 'uuid'. (Think "live" and "inactive" device-mapper tables.)
*/
uint64_t luid;
char uuid[DM_UUID_LEN];
char padding[7]; /* Padding because DM_UUID_LEN = 129 */ char padding[7]; /* Padding because DM_UUID_LEN = 129 */
int32_t error; /* Used to report back processing errors */ int32_t error; /* Used to report back processing errors */