pnfs: proper handling of pnfs COMMITs
COMMIT-to-ds: if pnfs_write() finds that its data server requests weren't written stably, it must fail with PNFSERR_IO instead of sending a COMMIT to the mds. mds COMMITs can only be used for mds WRITEs in this configuration. COMMIT-to-mds: the mds and data servers are required to use a common write/commit verifier, so the mds COMMIT's verifier must be checked against all ds verifiers. Signed-off-by: Casey Bodley <cbodley@citi.umich.edu>
This commit is contained in:
parent
db7caebe28
commit
18d462a37e
1 changed files with 57 additions and 20 deletions
|
|
@ -45,6 +45,7 @@ typedef struct __pnfs_io_pattern {
|
||||||
} pnfs_io_pattern;
|
} pnfs_io_pattern;
|
||||||
|
|
||||||
typedef struct __pnfs_io_thread {
|
typedef struct __pnfs_io_thread {
|
||||||
|
nfs41_write_verf verf;
|
||||||
pnfs_io_pattern *pattern;
|
pnfs_io_pattern *pattern;
|
||||||
pnfs_file_layout *layout;
|
pnfs_file_layout *layout;
|
||||||
nfs41_path_fh *file;
|
nfs41_path_fh *file;
|
||||||
|
|
@ -552,7 +553,6 @@ static uint32_t WINAPI file_layout_write_thread(void *args)
|
||||||
{
|
{
|
||||||
pnfs_io_unit io;
|
pnfs_io_unit io;
|
||||||
stateid_arg stateid;
|
stateid_arg stateid;
|
||||||
nfs41_write_verf verf;
|
|
||||||
pnfs_io_thread *thread = (pnfs_io_thread*)args;
|
pnfs_io_thread *thread = (pnfs_io_thread*)args;
|
||||||
pnfs_io_pattern *pattern = thread->pattern;
|
pnfs_io_pattern *pattern = thread->pattern;
|
||||||
pnfs_data_server *server;
|
pnfs_data_server *server;
|
||||||
|
|
@ -597,16 +597,16 @@ retry_write:
|
||||||
if (io.length > maxwritesize)
|
if (io.length > maxwritesize)
|
||||||
io.length = maxwritesize;
|
io.length = maxwritesize;
|
||||||
|
|
||||||
nfsstat = nfs41_write(client->session, thread->file, &stateid, io.buffer,
|
nfsstat = nfs41_write(client->session, thread->file, &stateid,
|
||||||
(uint32_t)io.length, io.offset, UNSTABLE4, &bytes_written,
|
io.buffer, (uint32_t)io.length, io.offset, UNSTABLE4,
|
||||||
&verf, NULL);
|
&bytes_written, &thread->verf, NULL);
|
||||||
if (nfsstat) {
|
if (nfsstat) {
|
||||||
eprintf("nfs41_write() failed with %s\n",
|
eprintf("nfs41_write() failed with %s\n",
|
||||||
nfs_error_string(nfsstat));
|
nfs_error_string(nfsstat));
|
||||||
status = map_ds_error(nfsstat, pattern->state, thread->layout);
|
status = map_ds_error(nfsstat, pattern->state, thread->layout);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
if (!verify_write(&verf, &thread->stable))
|
if (!verify_write(&thread->verf, &thread->stable))
|
||||||
goto retry_write;
|
goto retry_write;
|
||||||
|
|
||||||
total_written += bytes_written;
|
total_written += bytes_written;
|
||||||
|
|
@ -635,11 +635,11 @@ retry_write:
|
||||||
dprintf(1, "sending COMMIT to data server for offset=%lld len=%lld\n",
|
dprintf(1, "sending COMMIT to data server for offset=%lld len=%lld\n",
|
||||||
commit_min, commit_max - commit_min);
|
commit_min, commit_max - commit_min);
|
||||||
nfsstat = nfs41_commit(client->session, thread->file,
|
nfsstat = nfs41_commit(client->session, thread->file,
|
||||||
commit_min, (uint32_t)(commit_max - commit_min), 0, &verf, NULL);
|
commit_min, (uint32_t)(commit_max - commit_min), 0, &thread->verf, NULL);
|
||||||
|
|
||||||
if (nfsstat)
|
if (nfsstat)
|
||||||
status = map_ds_error(nfsstat, pattern->state, thread->layout);
|
status = map_ds_error(nfsstat, pattern->state, thread->layout);
|
||||||
else if (!verify_commit(&verf)) {
|
else if (!verify_commit(&thread->verf)) {
|
||||||
/* resend the writes unless the layout was recalled */
|
/* resend the writes unless the layout was recalled */
|
||||||
if (status != PNFSERR_LAYOUT_RECALLED)
|
if (status != PNFSERR_LAYOUT_RECALLED)
|
||||||
goto retry_write;
|
goto retry_write;
|
||||||
|
|
@ -711,6 +711,54 @@ out:
|
||||||
return status;
|
return status;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static enum pnfs_status mds_commit(
|
||||||
|
IN nfs41_open_state *state,
|
||||||
|
IN uint64_t offset,
|
||||||
|
IN uint32_t length,
|
||||||
|
IN const pnfs_io_pattern *pattern,
|
||||||
|
OUT nfs41_file_info *info)
|
||||||
|
{
|
||||||
|
nfs41_write_verf verf;
|
||||||
|
enum nfsstat4 nfsstat;
|
||||||
|
enum pnfs_status status = PNFS_SUCCESS;
|
||||||
|
uint32_t i;
|
||||||
|
|
||||||
|
nfsstat = nfs41_commit(state->session,
|
||||||
|
&state->file, offset, length, 1, &verf, info);
|
||||||
|
if (nfsstat) {
|
||||||
|
eprintf("nfs41_commit() to mds failed with %s\n",
|
||||||
|
nfs_error_string(nfsstat));
|
||||||
|
status = PNFSERR_IO;
|
||||||
|
goto out;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* 13.7. COMMIT through Metadata Server:
|
||||||
|
* If nfl_util & NFL4_UFLG_COMMIT_THRU_MDS is TRUE, then in order to
|
||||||
|
* maintain the current NFSv4.1 commit and recovery model, the data
|
||||||
|
* servers MUST return a common writeverf verifier in all WRITE
|
||||||
|
* responses for a given file layout, and the metadata server's
|
||||||
|
* COMMIT implementation must return the same writeverf. */
|
||||||
|
for (i = 0; i < pattern->count; i++) {
|
||||||
|
const pnfs_io_thread *thread = &pattern->threads[i];
|
||||||
|
if (thread->stable != UNSTABLE4) /* already committed */
|
||||||
|
continue;
|
||||||
|
|
||||||
|
if (!should_commit_to_mds(thread->layout)) {
|
||||||
|
/* commit to mds is not allowed on this layout */
|
||||||
|
eprintf("mds commit: failed to commit to data server\n");
|
||||||
|
status = PNFSERR_IO;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
if (memcmp(verf.verf, thread->verf.verf, NFS4_VERIFIER_SIZE) != 0) {
|
||||||
|
eprintf("mds commit verifier doesn't match ds write verifiers\n");
|
||||||
|
status = PNFSERR_IO;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
out:
|
||||||
|
return status;
|
||||||
|
}
|
||||||
|
|
||||||
static enum pnfs_status layout_commit(
|
static enum pnfs_status layout_commit(
|
||||||
IN nfs41_open_state *state,
|
IN nfs41_open_state *state,
|
||||||
IN pnfs_layout_state *layout,
|
IN pnfs_layout_state *layout,
|
||||||
|
|
@ -764,7 +812,6 @@ enum pnfs_status pnfs_write(
|
||||||
pnfs_io_pattern pattern;
|
pnfs_io_pattern pattern;
|
||||||
enum stable_how4 stable;
|
enum stable_how4 stable;
|
||||||
enum pnfs_status status;
|
enum pnfs_status status;
|
||||||
enum nfsstat4 nfsstat;
|
|
||||||
|
|
||||||
dprintf(IOLVL, "--> pnfs_write(%llu, %llu)\n", offset, length);
|
dprintf(IOLVL, "--> pnfs_write(%llu, %llu)\n", offset, length);
|
||||||
|
|
||||||
|
|
@ -804,18 +851,8 @@ enum pnfs_status pnfs_write(
|
||||||
goto out_free_pattern;
|
goto out_free_pattern;
|
||||||
|
|
||||||
if (stable == UNSTABLE4) {
|
if (stable == UNSTABLE4) {
|
||||||
nfs41_write_verf ignored;
|
/* send COMMIT to the mds and verify against all ds writes */
|
||||||
|
status = mds_commit(state, offset, *len_out, &pattern, info);
|
||||||
/* not all data was committed, so commit to metadata server */
|
|
||||||
dprintf(1, "sending COMMIT to meta server for offset=%lld len=%lld\n",
|
|
||||||
offset, *len_out);
|
|
||||||
nfsstat = nfs41_commit(state->session, &state->file,
|
|
||||||
offset, *len_out, 1, &ignored, info);
|
|
||||||
if (nfsstat) {
|
|
||||||
dprintf(IOLVL, "nfs41_commit() failed with %s\n",
|
|
||||||
nfs_error_string(nfsstat));
|
|
||||||
status = PNFSERR_IO;
|
|
||||||
}
|
|
||||||
} else if (stable == DATA_SYNC4) {
|
} else if (stable == DATA_SYNC4) {
|
||||||
/* send LAYOUTCOMMIT to sync the metadata */
|
/* send LAYOUTCOMMIT to sync the metadata */
|
||||||
status = layout_commit(state, layout, offset, *len_out, info);
|
status = layout_commit(state, layout, offset, *len_out, info);
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue