- Speed up synchronization process by using configurable number of I/O

requests in parallel.
  + Add kern.geom.mirror.sync_requests tunable which defines how many parallel
    I/O requests should be used.
  + Retire kern.geom.mirror.reqs_per_sync and kern.geom.mirror.syncs_per_sec
    sysctls.
- Fix race between regular and synchronization requests.
- Reimplement mirror's data synchronization - do not use the topology lock
  for this purpose, as it may case deadlocks.
- Stop synchronization from pre-sync hook.
- Fix some other minor issues.

MFC after:	3 days
This commit is contained in:
Pawel Jakub Dawidek 2006-03-13 00:58:41 +00:00
parent c053f1f8ac
commit 855761d5db
3 changed files with 561 additions and 276 deletions

File diff suppressed because it is too large Load Diff

View File

@ -103,9 +103,9 @@ struct g_mirror_disk_sync {
off_t ds_offset; /* Offset of next request to send. */ off_t ds_offset; /* Offset of next request to send. */
off_t ds_offset_done; /* Offset of already synchronized off_t ds_offset_done; /* Offset of already synchronized
region. */ region. */
off_t ds_resync; /* Resynchronize from this offset. */
u_int ds_syncid; /* Disk's synchronization ID. */ u_int ds_syncid; /* Disk's synchronization ID. */
u_char *ds_data; u_int ds_inflight; /* Number of in-flight sync requests. */
struct bio **ds_bios; /* BIOs for synchronization I/O. */
}; };
/* /*
@ -174,9 +174,18 @@ struct g_mirror_softc {
uint32_t sc_id; /* Mirror unique ID. */ uint32_t sc_id; /* Mirror unique ID. */
struct sx sc_lock;
struct bio_queue_head sc_queue; struct bio_queue_head sc_queue;
struct mtx sc_queue_mtx; struct mtx sc_queue_mtx;
struct proc *sc_worker; struct proc *sc_worker;
struct bio_queue_head sc_regular_delayed; /* Delayed I/O requests due
collision with sync
requests. */
struct bio_queue_head sc_inflight; /* In-flight regular write
requests. */
struct bio_queue_head sc_sync_delayed; /* Delayed sync requests due
collision with regular
requests. */
LIST_HEAD(, g_mirror_disk) sc_disks; LIST_HEAD(, g_mirror_disk) sc_disks;
u_int sc_ndisks; /* Number of disks. */ u_int sc_ndisks; /* Number of disks. */

View File

@ -51,7 +51,7 @@ g_mirror_find_device(struct g_class *mp, const char *name)
struct g_mirror_softc *sc; struct g_mirror_softc *sc;
struct g_geom *gp; struct g_geom *gp;
g_topology_assert(); g_topology_lock();
LIST_FOREACH(gp, &mp->geom, geom) { LIST_FOREACH(gp, &mp->geom, geom) {
sc = gp->softc; sc = gp->softc;
if (sc == NULL) if (sc == NULL)
@ -60,9 +60,12 @@ g_mirror_find_device(struct g_class *mp, const char *name)
continue; continue;
if (strcmp(gp->name, name) == 0 || if (strcmp(gp->name, name) == 0 ||
strcmp(sc->sc_name, name) == 0) { strcmp(sc->sc_name, name) == 0) {
g_topology_unlock();
sx_xlock(&sc->sc_lock);
return (sc); return (sc);
} }
} }
g_topology_unlock();
return (NULL); return (NULL);
} }
@ -71,7 +74,7 @@ g_mirror_find_disk(struct g_mirror_softc *sc, const char *name)
{ {
struct g_mirror_disk *disk; struct g_mirror_disk *disk;
g_topology_assert(); sx_assert(&sc->sc_lock, SX_XLOCKED);
LIST_FOREACH(disk, &sc->sc_disks, d_next) { LIST_FOREACH(disk, &sc->sc_disks, d_next) {
if (disk->d_consumer == NULL) if (disk->d_consumer == NULL)
continue; continue;
@ -94,7 +97,6 @@ g_mirror_ctl_configure(struct gctl_req *req, struct g_class *mp)
uint8_t balance; uint8_t balance;
int *nargs, *autosync, *noautosync, *hardcode, *dynamic, do_sync = 0; int *nargs, *autosync, *noautosync, *hardcode, *dynamic, do_sync = 0;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -109,38 +111,11 @@ g_mirror_ctl_configure(struct gctl_req *req, struct g_class *mp)
gctl_error(req, "No 'arg%u' argument.", 0); gctl_error(req, "No 'arg%u' argument.", 0);
return; return;
} }
sc = g_mirror_find_device(mp, name);
if (sc == NULL) {
gctl_error(req, "No such device: %s.", name);
return;
}
if (g_mirror_ndisks(sc, -1) < sc->sc_ndisks) {
gctl_error(req, "Not all disks connected.");
return;
}
balancep = gctl_get_asciiparam(req, "balance"); balancep = gctl_get_asciiparam(req, "balance");
if (balancep == NULL) { if (balancep == NULL) {
gctl_error(req, "No '%s' argument.", "balance"); gctl_error(req, "No '%s' argument.", "balance");
return; return;
} }
if (strcmp(balancep, "none") == 0)
balance = sc->sc_balance;
else {
if (balance_id(balancep) == -1) {
gctl_error(req, "Invalid balance algorithm.");
return;
}
balance = balance_id(balancep);
}
slicep = gctl_get_paraml(req, "slice", sizeof(*slicep));
if (slicep == NULL) {
gctl_error(req, "No '%s' argument.", "slice");
return;
}
if (*slicep == -1)
slice = sc->sc_slice;
else
slice = *slicep;
autosync = gctl_get_paraml(req, "autosync", sizeof(*autosync)); autosync = gctl_get_paraml(req, "autosync", sizeof(*autosync));
if (autosync == NULL) { if (autosync == NULL) {
gctl_error(req, "No '%s' argument.", "autosync"); gctl_error(req, "No '%s' argument.", "autosync");
@ -161,11 +136,6 @@ g_mirror_ctl_configure(struct gctl_req *req, struct g_class *mp)
gctl_error(req, "No '%s' argument.", "dynamic"); gctl_error(req, "No '%s' argument.", "dynamic");
return; return;
} }
if (sc->sc_balance == balance && sc->sc_slice == slice && !*autosync &&
!*noautosync && !*hardcode && !*dynamic) {
gctl_error(req, "Nothing has changed.");
return;
}
if (*autosync && *noautosync) { if (*autosync && *noautosync) {
gctl_error(req, "'%s' and '%s' specified.", "autosync", gctl_error(req, "'%s' and '%s' specified.", "autosync",
"noautosync"); "noautosync");
@ -176,6 +146,43 @@ g_mirror_ctl_configure(struct gctl_req *req, struct g_class *mp)
"dynamic"); "dynamic");
return; return;
} }
sc = g_mirror_find_device(mp, name);
if (sc == NULL) {
gctl_error(req, "No such device: %s.", name);
return;
}
if (strcmp(balancep, "none") == 0)
balance = sc->sc_balance;
else {
if (balance_id(balancep) == -1) {
gctl_error(req, "Invalid balance algorithm.");
sx_xunlock(&sc->sc_lock);
return;
}
balance = balance_id(balancep);
}
slicep = gctl_get_paraml(req, "slice", sizeof(*slicep));
if (slicep == NULL) {
gctl_error(req, "No '%s' argument.", "slice");
sx_xunlock(&sc->sc_lock);
return;
}
if (*slicep == -1)
slice = sc->sc_slice;
else
slice = *slicep;
if (g_mirror_ndisks(sc, -1) < sc->sc_ndisks) {
sx_xunlock(&sc->sc_lock);
gctl_error(req, "Not all disks connected. Try 'forget' command "
"first.");
return;
}
if (sc->sc_balance == balance && sc->sc_slice == slice && !*autosync &&
!*noautosync && !*hardcode && !*dynamic) {
sx_xunlock(&sc->sc_lock);
gctl_error(req, "Nothing has changed.");
return;
}
sc->sc_balance = balance; sc->sc_balance = balance;
sc->sc_slice = slice; sc->sc_slice = slice;
if ((sc->sc_flags & G_MIRROR_DEVICE_FLAG_NOAUTOSYNC) != 0) { if ((sc->sc_flags & G_MIRROR_DEVICE_FLAG_NOAUTOSYNC) != 0) {
@ -205,6 +212,7 @@ g_mirror_ctl_configure(struct gctl_req *req, struct g_class *mp)
} }
} }
} }
sx_xunlock(&sc->sc_lock);
} }
static void static void
@ -219,7 +227,6 @@ g_mirror_ctl_rebuild(struct gctl_req *req, struct g_class *mp)
int error, *nargs; int error, *nargs;
u_int i; u_int i;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -239,7 +246,6 @@ g_mirror_ctl_rebuild(struct gctl_req *req, struct g_class *mp)
gctl_error(req, "No such device: %s.", name); gctl_error(req, "No such device: %s.", name);
return; return;
} }
for (i = 1; i < (u_int)*nargs; i++) { for (i = 1; i < (u_int)*nargs; i++) {
snprintf(param, sizeof(param), "arg%u", i); snprintf(param, sizeof(param), "arg%u", i);
name = gctl_get_asciiparam(req, param); name = gctl_get_asciiparam(req, param);
@ -261,7 +267,7 @@ g_mirror_ctl_rebuild(struct gctl_req *req, struct g_class *mp)
gctl_error(req, gctl_error(req,
"Provider %s is the last active provider in %s.", "Provider %s is the last active provider in %s.",
name, sc->sc_geom->name); name, sc->sc_geom->name);
return; break;
} }
/* /*
* Do rebuild by resetting syncid, disconnecting the disk and * Do rebuild by resetting syncid, disconnecting the disk and
@ -272,7 +278,9 @@ g_mirror_ctl_rebuild(struct gctl_req *req, struct g_class *mp)
disk->d_flags |= G_MIRROR_DISK_FLAG_FORCE_SYNC; disk->d_flags |= G_MIRROR_DISK_FLAG_FORCE_SYNC;
g_mirror_update_metadata(disk); g_mirror_update_metadata(disk);
pp = disk->d_consumer->provider; pp = disk->d_consumer->provider;
g_topology_lock();
error = g_mirror_read_metadata(disk->d_consumer, &md); error = g_mirror_read_metadata(disk->d_consumer, &md);
g_topology_unlock();
g_mirror_event_send(disk, G_MIRROR_DISK_STATE_DISCONNECTED, g_mirror_event_send(disk, G_MIRROR_DISK_STATE_DISCONNECTED,
G_MIRROR_EVENT_WAIT); G_MIRROR_EVENT_WAIT);
if (error != 0) { if (error != 0) {
@ -287,6 +295,7 @@ g_mirror_ctl_rebuild(struct gctl_req *req, struct g_class *mp)
continue; continue;
} }
} }
sx_xunlock(&sc->sc_lock);
} }
static void static void
@ -308,7 +317,6 @@ g_mirror_ctl_insert(struct gctl_req *req, struct g_class *mp)
struct g_consumer *consumer; struct g_consumer *consumer;
} *disks; } *disks;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -345,10 +353,12 @@ g_mirror_ctl_insert(struct gctl_req *req, struct g_class *mp)
} }
if (g_mirror_ndisks(sc, -1) < sc->sc_ndisks) { if (g_mirror_ndisks(sc, -1) < sc->sc_ndisks) {
gctl_error(req, "Not all disks connected."); gctl_error(req, "Not all disks connected.");
sx_xunlock(&sc->sc_lock);
return; return;
} }
disks = g_malloc(sizeof(*disks) * (*nargs), M_WAITOK | M_ZERO); disks = g_malloc(sizeof(*disks) * (*nargs), M_WAITOK | M_ZERO);
g_topology_lock();
for (i = 1, n = 0; i < (u_int)*nargs; i++) { for (i = 1, n = 0; i < (u_int)*nargs; i++) {
snprintf(param, sizeof(param), "arg%u", i); snprintf(param, sizeof(param), "arg%u", i);
name = gctl_get_asciiparam(req, param); name = gctl_get_asciiparam(req, param);
@ -394,6 +404,8 @@ g_mirror_ctl_insert(struct gctl_req *req, struct g_class *mp)
n++; n++;
} }
if (n == 0) { if (n == 0) {
g_topology_unlock();
sx_xunlock(&sc->sc_lock);
g_free(disks); g_free(disks);
return; return;
} }
@ -431,8 +443,10 @@ again:
goto again; goto again;
} }
} }
g_topology_unlock();
if (i == 0) { if (i == 0) {
/* All writes failed. */ /* All writes failed. */
sx_xunlock(&sc->sc_lock);
g_free(disks); g_free(disks);
return; return;
} }
@ -442,6 +456,7 @@ again:
/* /*
* Release provider and wait for retaste. * Release provider and wait for retaste.
*/ */
g_topology_lock();
for (i = 0; i < n; i++) { for (i = 0; i < n; i++) {
if (disks[i].consumer == NULL) if (disks[i].consumer == NULL)
continue; continue;
@ -449,6 +464,8 @@ again:
g_detach(disks[i].consumer); g_detach(disks[i].consumer);
g_destroy_consumer(disks[i].consumer); g_destroy_consumer(disks[i].consumer);
} }
g_topology_unlock();
sx_xunlock(&sc->sc_lock);
g_free(disks); g_free(disks);
} }
@ -462,7 +479,6 @@ g_mirror_ctl_remove(struct gctl_req *req, struct g_class *mp)
int *nargs; int *nargs;
u_int i; u_int i;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -483,10 +499,11 @@ g_mirror_ctl_remove(struct gctl_req *req, struct g_class *mp)
return; return;
} }
if (g_mirror_ndisks(sc, -1) < sc->sc_ndisks) { if (g_mirror_ndisks(sc, -1) < sc->sc_ndisks) {
gctl_error(req, "Not all disks connected."); sx_xunlock(&sc->sc_lock);
gctl_error(req, "Not all disks connected. Try 'forget' command "
"first.");
return; return;
} }
for (i = 1; i < (u_int)*nargs; i++) { for (i = 1; i < (u_int)*nargs; i++) {
snprintf(param, sizeof(param), "arg%u", i); snprintf(param, sizeof(param), "arg%u", i);
name = gctl_get_asciiparam(req, param); name = gctl_get_asciiparam(req, param);
@ -500,8 +517,9 @@ g_mirror_ctl_remove(struct gctl_req *req, struct g_class *mp)
continue; continue;
} }
g_mirror_event_send(disk, G_MIRROR_DISK_STATE_DESTROY, g_mirror_event_send(disk, G_MIRROR_DISK_STATE_DESTROY,
G_MIRROR_EVENT_WAIT); G_MIRROR_EVENT_DONTWAIT);
} }
sx_xunlock(&sc->sc_lock);
} }
static void static void
@ -514,7 +532,6 @@ g_mirror_ctl_deactivate(struct gctl_req *req, struct g_class *mp)
int *nargs; int *nargs;
u_int i; u_int i;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -534,7 +551,6 @@ g_mirror_ctl_deactivate(struct gctl_req *req, struct g_class *mp)
gctl_error(req, "No such device: %s.", name); gctl_error(req, "No such device: %s.", name);
return; return;
} }
for (i = 1; i < (u_int)*nargs; i++) { for (i = 1; i < (u_int)*nargs; i++) {
snprintf(param, sizeof(param), "arg%u", i); snprintf(param, sizeof(param), "arg%u", i);
name = gctl_get_asciiparam(req, param); name = gctl_get_asciiparam(req, param);
@ -552,8 +568,9 @@ g_mirror_ctl_deactivate(struct gctl_req *req, struct g_class *mp)
g_mirror_update_metadata(disk); g_mirror_update_metadata(disk);
sc->sc_bump_id |= G_MIRROR_BUMP_SYNCID; sc->sc_bump_id |= G_MIRROR_BUMP_SYNCID;
g_mirror_event_send(disk, G_MIRROR_DISK_STATE_DISCONNECTED, g_mirror_event_send(disk, G_MIRROR_DISK_STATE_DISCONNECTED,
G_MIRROR_EVENT_WAIT); G_MIRROR_EVENT_DONTWAIT);
} }
sx_xunlock(&sc->sc_lock);
} }
static void static void
@ -566,7 +583,6 @@ g_mirror_ctl_forget(struct gctl_req *req, struct g_class *mp)
int *nargs; int *nargs;
u_int i; u_int i;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -590,6 +606,7 @@ g_mirror_ctl_forget(struct gctl_req *req, struct g_class *mp)
return; return;
} }
if (g_mirror_ndisks(sc, -1) == sc->sc_ndisks) { if (g_mirror_ndisks(sc, -1) == sc->sc_ndisks) {
sx_xunlock(&sc->sc_lock);
G_MIRROR_DEBUG(1, G_MIRROR_DEBUG(1,
"All disks connected in %s, skipping.", "All disks connected in %s, skipping.",
sc->sc_name); sc->sc_name);
@ -599,6 +616,7 @@ g_mirror_ctl_forget(struct gctl_req *req, struct g_class *mp)
LIST_FOREACH(disk, &sc->sc_disks, d_next) { LIST_FOREACH(disk, &sc->sc_disks, d_next) {
g_mirror_update_metadata(disk); g_mirror_update_metadata(disk);
} }
sx_xunlock(&sc->sc_lock);
} }
} }
@ -611,8 +629,6 @@ g_mirror_ctl_stop(struct gctl_req *req, struct g_class *mp)
char param[16]; char param[16];
u_int i; u_int i;
g_topology_assert();
nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs));
if (nargs == NULL) { if (nargs == NULL) {
gctl_error(req, "No '%s' argument.", "nargs"); gctl_error(req, "No '%s' argument.", "nargs");
@ -644,8 +660,10 @@ g_mirror_ctl_stop(struct gctl_req *req, struct g_class *mp)
if (error != 0) { if (error != 0) {
gctl_error(req, "Cannot destroy device %s (error=%d).", gctl_error(req, "Cannot destroy device %s (error=%d).",
sc->sc_geom->name, error); sc->sc_geom->name, error);
sx_xunlock(&sc->sc_lock);
return; return;
} }
/* No need to unlock, because lock is already dead. */
} }
} }
@ -666,6 +684,7 @@ g_mirror_config(struct gctl_req *req, struct g_class *mp, const char *verb)
return; return;
} }
g_topology_unlock();
if (strcmp(verb, "configure") == 0) if (strcmp(verb, "configure") == 0)
g_mirror_ctl_configure(req, mp); g_mirror_ctl_configure(req, mp);
else if (strcmp(verb, "rebuild") == 0) else if (strcmp(verb, "rebuild") == 0)
@ -682,4 +701,5 @@ g_mirror_config(struct gctl_req *req, struct g_class *mp, const char *verb)
g_mirror_ctl_stop(req, mp); g_mirror_ctl_stop(req, mp);
else else
gctl_error(req, "Unknown verb."); gctl_error(req, "Unknown verb.");
g_topology_lock();
} }