Richard W.M. Jones
2020-Aug-06 13:16 UTC
[Libguestfs] [PATCH nbdkit NOT WORKING 0/2] vddk: Relax threading model.
I believe this roughly implements Nir's proposal here: https://www.redhat.com/archives/libguestfs/2020-August/msg00028.html Unfortunately it doesn't work for me. It actually slows things down quite a lot, for reasons I don't understand. Note the adjustment of the pool-max parameter and how it affects the total time. The results are quite reproducible. $ ./nbdkit -r -U - vddk libdir=~/tmp/vddk-7.0.0/vmware-vix-disklib-distrib user=root password=*** server=*** thumbprint=*** vm=moref=3 file='[datastore1] Fedora 28/Fedora 28.vmdk' pool-max=1 --run 'time qemu-img convert -p -W -m 16 $nbd /var/tmp/out' (100.00/100%) real 1m8.031s user 0m0.112s sys 0m1.560s $ ./nbdkit -r -U - vddk libdir=~/tmp/vddk-7.0.0/vmware-vix-disklib-distrib user=root password=*** server=*** thumbprint=*** vm=moref=3 file='[datastore1] Fedora 28/Fedora 28.vmdk' pool-max=8 --run 'time qemu-img convert -p -W -m 16 $nbd /var/tmp/out' (100.00/100%) real 1m27.790s user 0m0.099s sys 0m1.625s I'm still investigating this. Could be a simple coding error somewhere. Rich.
Richard W.M. Jones
2020-Aug-06 13:16 UTC
[Libguestfs] [PATCH nbdkit 1/2] vddk: Relax threading model: SERIALIZE_ALL_REQUESTS -> SERIALIZE_REQUESTS.
See comment in code and https://www.redhat.com/archives/libguestfs/2020-August/msg00023.html --- plugins/vddk/vddk.c | 17 +++++++++++++---- 1 file changed, 13 insertions(+), 4 deletions(-) diff --git a/plugins/vddk/vddk.c b/plugins/vddk/vddk.c index c24da96f..5926e181 100644 --- a/plugins/vddk/vddk.c +++ b/plugins/vddk/vddk.c @@ -478,11 +478,18 @@ vddk_dump_plugin (void) #endif } -/* XXX To really do threading correctly in accordance with the VDDK - * documentation, we must do all open/close calls from a single - * thread. This is a huge pain. +/* The rules on threads and VDDK are here: + * https://code.vmware.com/docs/11750/virtual-disk-development-kit-programming-guide/GUID-6BE903E8-DC70-46D9-98E4-E34A2002C2AD.html + * + * Before nbdkit 1.22 we used SERIALIZE_ALL_REQUESTS. Since nbdkit + * 1.22 we changed this to SERIALIZE_REQUESTS and added a mutex around + * calls to VixDiskLib_Open and VixDiskLib_Close. This is not quite + * within the letter of the rules, but is within the spirit. */ -#define THREAD_MODEL NBDKIT_THREAD_MODEL_SERIALIZE_ALL_REQUESTS +#define THREAD_MODEL NBDKIT_THREAD_MODEL_SERIALIZE_REQUESTS + +/* Lock protecting open/close calls - see above. */ +static pthread_mutex_t open_close_lock = PTHREAD_MUTEX_INITIALIZER; /* The per-connection handle. */ struct vddk_handle { @@ -524,6 +531,7 @@ free_connect_params (VixDiskLibConnectParams *params) static void * vddk_open (int readonly) { + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); struct vddk_handle *h; VixError err; uint32_t flags; @@ -616,6 +624,7 @@ vddk_open (int readonly) static void vddk_close (void *handle) { + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); struct vddk_handle *h = handle; DEBUG_CALL ("VixDiskLib_Close", "handle"); -- 2.27.0
Richard W.M. Jones
2020-Aug-06 13:16 UTC
[Libguestfs] [PATCH nbdkit 2/2] vddk: Relax thread model to PARALLEL and implement a disk handle pool.
The pool is only used for readonly connections, since writable connections usually take a lock on the server side and therefore you cannot open more than one. --- plugins/vddk/nbdkit-vddk-plugin.pod | 7 + plugins/vddk/vddk.c | 201 ++++++++++++++++++++++------ 2 files changed, 164 insertions(+), 44 deletions(-) diff --git a/plugins/vddk/nbdkit-vddk-plugin.pod b/plugins/vddk/nbdkit-vddk-plugin.pod index e5539da9..288aed4b 100644 --- a/plugins/vddk/nbdkit-vddk-plugin.pod +++ b/plugins/vddk/nbdkit-vddk-plugin.pod @@ -175,6 +175,13 @@ Read the password from file descriptor number C<FD>, inherited from the parent process when nbdkit starts up. This is also a secure method to supply a password. +=item B<pool-max=>N + +To improve performance, for read-only connections (see I<-r> option) +the plugin will open a pool of VixDiskLibHandle disk handles. You can +use this option to control the maximum size of the pool. The default +is 8. To disable this feature, set it to 0 or 1. + =item B<port=>PORT The port on the VCenter/ESXi host. Defaults to 443. diff --git a/plugins/vddk/vddk.c b/plugins/vddk/vddk.c index 5926e181..173d5031 100644 --- a/plugins/vddk/vddk.c +++ b/plugins/vddk/vddk.c @@ -52,6 +52,7 @@ #include "isaligned.h" #include "minmax.h" #include "rounding.h" +#include "vector.h" #include "vddk.h" #include "vddk-structs.h" @@ -85,6 +86,7 @@ char *libdir; /* libdir */ static uint16_t nfc_host_port; /* nfchostport */ char *password; /* password */ static uint16_t port; /* port */ +static unsigned pool_max = 8; /* pool-max */ static const char *server_name; /* server */ static bool single_link; /* single-link */ static const char *snapshot_moref; /* snapshot */ @@ -233,6 +235,12 @@ vddk_config (const char *key, const char *value) if (nbdkit_parse_uint16_t ("port", value, &port) == -1) return -1; } + else if (strcmp (key, "pool-max") == 0) { + if (nbdkit_parse_unsigned ("pool-max", value, &pool_max) == -1) + return -1; + if (pool_max < 1) + pool_max = 1; + } else if (strcmp (key, "reexeced_") == 0) { /* Special name because it is only for internal use. */ reexeced = (char *)value; @@ -482,20 +490,37 @@ vddk_dump_plugin (void) * https://code.vmware.com/docs/11750/virtual-disk-development-kit-programming-guide/GUID-6BE903E8-DC70-46D9-98E4-E34A2002C2AD.html * * Before nbdkit 1.22 we used SERIALIZE_ALL_REQUESTS. Since nbdkit - * 1.22 we changed this to SERIALIZE_REQUESTS and added a mutex around - * calls to VixDiskLib_Open and VixDiskLib_Close. This is not quite - * within the letter of the rules, but is within the spirit. + * 1.22 we changed this to PARALLEL, added a mutex around calls to + * VixDiskLib_Open and VixDiskLib_Close, and use a pool of disk + * handles. This is not quite within the letter of the rules, but is + * within the spirit. */ -#define THREAD_MODEL NBDKIT_THREAD_MODEL_SERIALIZE_REQUESTS +#define THREAD_MODEL NBDKIT_THREAD_MODEL_PARALLEL /* Lock protecting open/close calls - see above. */ static pthread_mutex_t open_close_lock = PTHREAD_MUTEX_INITIALIZER; -/* The per-connection handle. */ +struct handle; struct vddk_handle { + VixDiskLibHandle vddk_handle; + bool in_use; + struct handle *h; +}; +DEFINE_VECTOR_TYPE(vddk_handles, struct vddk_handle) + +/* The per-connection handle. */ +struct handle { VixDiskLibConnectParams *params; /* connection parameters */ VixDiskLibConnection connection; /* connection */ - VixDiskLibHandle handle; /* disk handle */ + int readonly; /* readonly flag for this connection */ + uint32_t flags; /* open flags */ + + /* Pool of VDDK disk handles. Do not access this directly, use + * GET_VDDK_HANDLE_FOR_CURRENT_SCOPE macro to get a free handle. + */ + pthread_mutex_t vddk_handles_lock; + pthread_cond_t vddk_handles_cond; + vddk_handles vddk_handles; }; static inline VixDiskLibConnectParams * @@ -531,17 +556,28 @@ free_connect_params (VixDiskLibConnectParams *params) static void * vddk_open (int readonly) { - ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); - struct vddk_handle *h; + struct handle *h; VixError err; - uint32_t flags; - h = malloc (sizeof *h); + h = calloc (1, sizeof *h); if (h == NULL) { - nbdkit_error ("malloc: %m"); + nbdkit_error ("calloc: %m"); return NULL; } + h->readonly = readonly; + pthread_mutex_init (&h->vddk_handles_lock, NULL); + pthread_cond_init (&h->vddk_handles_cond, NULL); + + /* We have to reserve this vector to ensure that it is not + * reallocated, as that would make the pointer returned by + * get_vddk_handle in another thread invalid. + */ + if (vddk_handles_reserve (&h->vddk_handles, pool_max) == -1) { + nbdkit_error ("realloc: %m"); + goto err0; + } + h->params = allocate_connect_params (); if (h->params == NULL) { nbdkit_error ("allocate VixDiskLibConnectParams: %m"); @@ -589,49 +625,120 @@ vddk_open (int readonly) goto err1; } - flags = 0; + h->flags = 0; if (readonly) - flags |= VIXDISKLIB_FLAG_OPEN_READ_ONLY; + h->flags |= VIXDISKLIB_FLAG_OPEN_READ_ONLY; if (single_link) - flags |= VIXDISKLIB_FLAG_OPEN_SINGLE_LINK; + h->flags |= VIXDISKLIB_FLAG_OPEN_SINGLE_LINK; if (unbuffered) - flags |= VIXDISKLIB_FLAG_OPEN_UNBUFFERED; - - DEBUG_CALL ("VixDiskLib_Open", - "connection, %s, %d, &handle", filename, flags); - err = VixDiskLib_Open (h->connection, filename, flags, &h->handle); - if (err != VIX_OK) { - VDDK_ERROR (err, "VixDiskLib_Open: %s", filename); - goto err2; - } - - nbdkit_debug ("transport mode: %s", - VixDiskLib_GetTransportMode (h->handle)); + h->flags |= VIXDISKLIB_FLAG_OPEN_UNBUFFERED; return h; - err2: - DEBUG_CALL ("VixDiskLib_Disconnect", "connection"); - VixDiskLib_Disconnect (h->connection); err1: free_connect_params (h->params); err0: + free (h->vddk_handles.ptr); + pthread_cond_destroy (&h->vddk_handles_cond); + pthread_mutex_destroy (&h->vddk_handles_lock); free (h); return NULL; } +/* Get a VDDK handle on demand. */ +static VixDiskLibHandle +open_vddk_handle (struct handle *h) +{ + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); + VixDiskLibHandle vddk_handle; + VixError err; + + DEBUG_CALL ("VixDiskLib_Open", + "connection, %s, %d, &handle", filename, h->flags); + err = VixDiskLib_Open (h->connection, filename, h->flags, &vddk_handle); + if (err != VIX_OK) { + VDDK_ERROR (err, "VixDiskLib_Open: %s", filename); + return NULL; + } + + nbdkit_debug ("transport mode: %s", + VixDiskLib_GetTransportMode (vddk_handle)); + return vddk_handle; +} + +static struct vddk_handle * +get_vddk_handle (struct handle *h) +{ + const unsigned max = h->readonly ? pool_max : 1; + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&h->vddk_handles_lock); + VixDiskLibHandle vddk_handle; + size_t i; + + again: + /* See if there's a handle in the pool which is not in use. */ + for (i = 0; i < h->vddk_handles.size; ++i) { + if (!h->vddk_handles.ptr[i].in_use) { + h->vddk_handles.ptr[i].in_use = true; + return &h->vddk_handles.ptr[i]; + } + } + + /* If the pool is too big we have to wait for another thread to + * finish using its handle and try again. + */ + if (h->vddk_handles.size >= max) { + pthread_cond_wait (&h->vddk_handles_cond, &h->vddk_handles_lock); + goto again; + } + + /* Open another handle and add it to the pool. Note that + * vddk_handles_append cannot fail because we reserved space in + * vddk_open. + */ + vddk_handle = open_vddk_handle (h); + if (vddk_handle == NULL) + return NULL; + vddk_handles_append (&h->vddk_handles, + (struct vddk_handle){ vddk_handle, true, h }); + return &h->vddk_handles.ptr[h->vddk_handles.size-1]; +} + +static void +put_vddk_handle (struct vddk_handle **p) +{ + if (*p) { + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&(*p)->h->vddk_handles_lock); + assert ((*p)->in_use); + (*p)->in_use = false; + pthread_cond_signal (&(*p)->h->vddk_handles_cond); + } +} + +/* Wrap get/put_vddk_handle in nicer macro. */ +#define GET_VDDK_HANDLE_FOR_CURRENT_SCOPE(h, name) \ + __attribute__((cleanup (put_vddk_handle))) \ + struct vddk_handle *name##_h = get_vddk_handle (h); \ + if (name##_h == NULL) return -1; \ + VixDiskLibHandle name = name##_h->vddk_handle + /* Free up the per-connection handle. */ static void vddk_close (void *handle) { ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); - struct vddk_handle *h = handle; + struct handle *h = handle; + size_t i; - DEBUG_CALL ("VixDiskLib_Close", "handle"); - VixDiskLib_Close (h->handle); + for (i = 0; i < h->vddk_handles.size; ++i) { + DEBUG_CALL ("VixDiskLib_Close", "handle"); + VixDiskLib_Close (h->vddk_handles.ptr[i].vddk_handle); + } + free (h->vddk_handles.ptr); DEBUG_CALL ("VixDiskLib_Disconnect", "connection"); VixDiskLib_Disconnect (h->connection); free_connect_params (h->params); + pthread_cond_destroy (&h->vddk_handles_cond); + pthread_mutex_destroy (&h->vddk_handles_lock); free (h); } @@ -639,13 +746,14 @@ vddk_close (void *handle) static int64_t vddk_get_size (void *handle) { - struct vddk_handle *h = handle; + struct handle *h = handle; + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); VixDiskLibInfo *info; VixError err; uint64_t size; DEBUG_CALL ("VixDiskLib_GetInfo", "handle, &info"); - err = VixDiskLib_GetInfo (h->handle, &info); + err = VixDiskLib_GetInfo (vddk_handle, &info); if (err != VIX_OK) { VDDK_ERROR (err, "VixDiskLib_GetInfo"); return -1; @@ -687,7 +795,8 @@ static int vddk_pread (void *handle, void *buf, uint32_t count, uint64_t offset, uint32_t flags) { - struct vddk_handle *h = handle; + struct handle *h = handle; + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); VixError err; /* Align to sectors. */ @@ -706,7 +815,7 @@ vddk_pread (void *handle, void *buf, uint32_t count, uint64_t offset, "handle, %" PRIu64 " sectors, " "%" PRIu32 " sectors, buffer", offset, count); - err = VixDiskLib_Read (h->handle, offset, count, buf); + err = VixDiskLib_Read (vddk_handle, offset, count, buf); if (err != VIX_OK) { VDDK_ERROR (err, "VixDiskLib_Read"); return -1; @@ -726,7 +835,8 @@ vddk_pwrite (void *handle, const void *buf, uint32_t count, uint64_t offset, uint32_t flags) { const bool fua = flags & NBDKIT_FLAG_FUA; - struct vddk_handle *h = handle; + struct handle *h = handle; + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); VixError err; /* Align to sectors. */ @@ -745,7 +855,7 @@ vddk_pwrite (void *handle, const void *buf, uint32_t count, uint64_t offset, "handle, %" PRIu64 " sectors, " "%" PRIu32 " sectors, buffer", offset, count); - err = VixDiskLib_Write (h->handle, offset, count, buf); + err = VixDiskLib_Write (vddk_handle, offset, count, buf); if (err != VIX_OK) { VDDK_ERROR (err, "VixDiskLib_Write"); return -1; @@ -761,7 +871,8 @@ vddk_pwrite (void *handle, const void *buf, uint32_t count, uint64_t offset, static int vddk_flush (void *handle, uint32_t flags) { - struct vddk_handle *h = handle; + struct handle *h = handle; + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); VixError err; /* The Flush call was not available in VDDK < 6.0 so this is simply @@ -771,7 +882,7 @@ vddk_flush (void *handle, uint32_t flags) return 0; DEBUG_CALL ("VixDiskLib_Flush", "handle"); - err = VixDiskLib_Flush (h->handle); + err = VixDiskLib_Flush (vddk_handle); if (err != VIX_OK) { VDDK_ERROR (err, "VixDiskLib_Flush"); return -1; @@ -783,7 +894,8 @@ vddk_flush (void *handle, uint32_t flags) static int vddk_can_extents (void *handle) { - struct vddk_handle *h = handle; + struct handle *h = handle; + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); VixError err; VixDiskLibBlockList *block_list; @@ -808,7 +920,7 @@ vddk_can_extents (void *handle) DEBUG_CALL ("VixDiskLib_QueryAllocatedBlocks", "handle, 0, %d sectors, %d sectors", VIXDISKLIB_MIN_CHUNK_SIZE, VIXDISKLIB_MIN_CHUNK_SIZE); - err = VixDiskLib_QueryAllocatedBlocks (h->handle, + err = VixDiskLib_QueryAllocatedBlocks (vddk_handle, 0, VIXDISKLIB_MIN_CHUNK_SIZE, VIXDISKLIB_MIN_CHUNK_SIZE, &block_list); @@ -864,7 +976,8 @@ static int vddk_extents (void *handle, uint32_t count, uint64_t offset, uint32_t flags, struct nbdkit_extents *extents) { - struct vddk_handle *h = handle; + struct handle *h = handle; + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); bool req_one = flags & NBDKIT_FLAG_REQ_ONE; uint64_t position, end, start_sector; @@ -896,7 +1009,7 @@ vddk_extents (void *handle, uint32_t count, uint64_t offset, uint32_t flags, "handle, %" PRIu64 " sectors, %" PRIu64 " sectors, " "%d sectors", start_sector, nr_sectors, VIXDISKLIB_MIN_CHUNK_SIZE); - err = VixDiskLib_QueryAllocatedBlocks (h->handle, + err = VixDiskLib_QueryAllocatedBlocks (vddk_handle, start_sector, nr_sectors, VIXDISKLIB_MIN_CHUNK_SIZE, &block_list); -- 2.27.0
Richard W.M. Jones
2020-Aug-06 14:35 UTC
Re: [Libguestfs] [PATCH nbdkit NOT WORKING 0/2] vddk: Relax threading model.
Even running this with lots of extra debugging it seems to be doing what is expected. I can't see the bug if there is one. Note I'm only testing qemu-img convert as that is what's relevant to virt-v2v. Previously I was using a hand-written test using libnbd that did random reads across the disk, and showed a modest improvement with 8 handles. Here are the results across a range of pool sizes, all with -W -m 16: 1 handle: real 1m8.031s user 0m0.112s sys 0m1.560s 2 handles: real 1m6.465s user 0m0.106s sys 0m1.607s 4 handles: real 1m21.488s user 0m0.126s sys 0m1.620s 8 handles: real 1m27.790s user 0m0.099s sys 0m1.625s 16 handles: real 1m33.974s user 0m0.124s sys 0m1.718s I also tried matching the number of coroutines to the number of handles in the pool (ie pool-max == -m): 1 coroutine, 1 handle: real 1m9.545s user 0m0.083s sys 0m1.592s 2 coroutines, 2 handles: real 1m6.130s user 0m0.078s sys 0m1.567s 4 coroutines, 4 handles: real 1m22.109s user 0m0.107s sys 0m1.690s 8 coroutines, 8 handles: real 1m26.490s user 0m0.108s sys 0m1.650s 16 coroutines, 16 handles (same as last result above): real 1m33.974s user 0m0.124s sys 0m1.718s Rich. -- Richard Jones, Virtualization Group, Red Hat http://people.redhat.com/~rjones Read my programming and virtualization blog: http://rwmj.wordpress.com Fedora Windows cross-compiler. Compile Windows programs, test, and build Windows installers. Over 100 libraries supported. http://fedoraproject.org/wiki/MinGW
Nir Soffer
2020-Aug-06 15:31 UTC
Re: [Libguestfs] [PATCH nbdkit 1/2] vddk: Relax threading model: SERIALIZE_ALL_REQUESTS -> SERIALIZE_REQUESTS.
On Thu, Aug 6, 2020, 16:16 Richard W.M. Jones <rjones@redhat.com> wrote:> See comment in code and > https://www.redhat.com/archives/libguestfs/2020-August/msg00023.html > --- > plugins/vddk/vddk.c | 17 +++++++++++++---- > 1 file changed, 13 insertions(+), 4 deletions(-) > > diff --git a/plugins/vddk/vddk.c b/plugins/vddk/vddk.c > index c24da96f..5926e181 100644 > --- a/plugins/vddk/vddk.c > +++ b/plugins/vddk/vddk.c > @@ -478,11 +478,18 @@ vddk_dump_plugin (void) > #endif > } > > -/* XXX To really do threading correctly in accordance with the VDDK > - * documentation, we must do all open/close calls from a single > - * thread. This is a huge pain. > +/* The rules on threads and VDDK are here: > + * > https://code.vmware.com/docs/11750/virtual-disk-development-kit-programming-guide/GUID-6BE903E8-DC70-46D9-98E4-E34A2002C2AD.html > + * > + * Before nbdkit 1.22 we used SERIALIZE_ALL_REQUESTS. Since nbdkit > + * 1.22 we changed this to SERIALIZE_REQUESTS and added a mutex around > + * calls to VixDiskLib_Open and VixDiskLib_Close. This is not quite > + * within the letter of the rules, but is within the spirit. >The document is very clear about using the same thread for open an close. Using a lock is not the same. I think Eric already wrote about this. */> -#define THREAD_MODEL NBDKIT_THREAD_MODEL_SERIALIZE_ALL_REQUESTS > +#define THREAD_MODEL NBDKIT_THREAD_MODEL_SERIALIZE_REQUESTS > + > +/* Lock protecting open/close calls - see above. */ > +static pthread_mutex_t open_close_lock = PTHREAD_MUTEX_INITIALIZER; > > /* The per-connection handle. */ > struct vddk_handle { > @@ -524,6 +531,7 @@ free_connect_params (VixDiskLibConnectParams *params) > static void * > vddk_open (int readonly) > { > + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); > struct vddk_handle *h; > VixError err; > uint32_t flags; > @@ -616,6 +624,7 @@ vddk_open (int readonly) > static void > vddk_close (void *handle) > { > + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); > struct vddk_handle *h = handle; > > DEBUG_CALL ("VixDiskLib_Close", "handle"); > -- > 2.27.0 > >
Nir Soffer
2020-Aug-06 15:46 UTC
Re: [Libguestfs] [PATCH nbdkit 2/2] vddk: Relax thread model to PARALLEL and implement a disk handle pool.
On Thu, Aug 6, 2020, 16:16 Richard W.M. Jones <rjones@redhat.com> wrote:> The pool is only used for readonly connections, since writable > connections usually take a lock on the server side and therefore you > cannot open more than one. > --- > plugins/vddk/nbdkit-vddk-plugin.pod | 7 + > plugins/vddk/vddk.c | 201 ++++++++++++++++++++++------ > 2 files changed, 164 insertions(+), 44 deletions(-) > > diff --git a/plugins/vddk/nbdkit-vddk-plugin.pod > b/plugins/vddk/nbdkit-vddk-plugin.pod > index e5539da9..288aed4b 100644 > --- a/plugins/vddk/nbdkit-vddk-plugin.pod > +++ b/plugins/vddk/nbdkit-vddk-plugin.pod > @@ -175,6 +175,13 @@ Read the password from file descriptor number C<FD>, > inherited from > the parent process when nbdkit starts up. This is also a secure > method to supply a password. > > +=item B<pool-max=>N > + > +To improve performance, for read-only connections (see I<-r> option) > +the plugin will open a pool of VixDiskLibHandle disk handles. You can > +use this option to control the maximum size of the pool. The default > +is 8. To disable this feature, set it to 0 or 1. > + > =item B<port=>PORT > > The port on the VCenter/ESXi host. Defaults to 443. > diff --git a/plugins/vddk/vddk.c b/plugins/vddk/vddk.c > index 5926e181..173d5031 100644 > --- a/plugins/vddk/vddk.c > +++ b/plugins/vddk/vddk.c > @@ -52,6 +52,7 @@ > #include "isaligned.h" > #include "minmax.h" > #include "rounding.h" > +#include "vector.h" > > #include "vddk.h" > #include "vddk-structs.h" > @@ -85,6 +86,7 @@ char *libdir; /* libdir */ > static uint16_t nfc_host_port; /* nfchostport */ > char *password; /* password */ > static uint16_t port; /* port */ > +static unsigned pool_max = 8; /* pool-max */ > static const char *server_name; /* server */ > static bool single_link; /* single-link */ > static const char *snapshot_moref; /* snapshot */ > @@ -233,6 +235,12 @@ vddk_config (const char *key, const char *value) > if (nbdkit_parse_uint16_t ("port", value, &port) == -1) > return -1; > } > + else if (strcmp (key, "pool-max") == 0) { > + if (nbdkit_parse_unsigned ("pool-max", value, &pool_max) == -1) > + return -1; > + if (pool_max < 1) > + pool_max = 1; > + } > else if (strcmp (key, "reexeced_") == 0) { > /* Special name because it is only for internal use. */ > reexeced = (char *)value; > @@ -482,20 +490,37 @@ vddk_dump_plugin (void) > * > https://code.vmware.com/docs/11750/virtual-disk-development-kit-programming-guide/GUID-6BE903E8-DC70-46D9-98E4-E34A2002C2AD.html > * > * Before nbdkit 1.22 we used SERIALIZE_ALL_REQUESTS. Since nbdkit > - * 1.22 we changed this to SERIALIZE_REQUESTS and added a mutex around > - * calls to VixDiskLib_Open and VixDiskLib_Close. This is not quite > - * within the letter of the rules, but is within the spirit. > + * 1.22 we changed this to PARALLEL, added a mutex around calls to > + * VixDiskLib_Open and VixDiskLib_Close, and use a pool of disk > + * handles. This is not quite within the letter of the rules, but is > + * within the spirit. > */ > -#define THREAD_MODEL NBDKIT_THREAD_MODEL_SERIALIZE_REQUESTS > +#define THREAD_MODEL NBDKIT_THREAD_MODEL_PARALLEL > > /* Lock protecting open/close calls - see above. */ > static pthread_mutex_t open_close_lock = PTHREAD_MUTEX_INITIALIZER; > > -/* The per-connection handle. */ > +struct handle; > struct vddk_handle { > + VixDiskLibHandle vddk_handle; > + bool in_use; > + struct handle *h; > +}; > +DEFINE_VECTOR_TYPE(vddk_handles, struct vddk_handle) > + > +/* The per-connection handle. */ > +struct handle { > VixDiskLibConnectParams *params; /* connection parameters */ > VixDiskLibConnection connection; /* connection */ >Given the poor results, I suspect that that handles created using same connection share a lock. This also makes sense if connection abstract a blocking socket. With multiple nbd connections we got 60% improvement. I expect to see similar results if we use multiple connection+handle pairs. Can you try to move the connection into the vddk_handle struct? - VixDiskLibHandle handle; /* disk handle */> + int readonly; /* readonly flag for this connection */ > + uint32_t flags; /* open flags */ > + > + /* Pool of VDDK disk handles. Do not access this directly, use > + * GET_VDDK_HANDLE_FOR_CURRENT_SCOPE macro to get a free handle. > + */ > + pthread_mutex_t vddk_handles_lock; > + pthread_cond_t vddk_handles_cond; > + vddk_handles vddk_handles; > }; > > static inline VixDiskLibConnectParams * > @@ -531,17 +556,28 @@ free_connect_params (VixDiskLibConnectParams *params) > static void * > vddk_open (int readonly) > { > - ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); > - struct vddk_handle *h; > + struct handle *h; > VixError err; > - uint32_t flags; > > - h = malloc (sizeof *h); > + h = calloc (1, sizeof *h); > if (h == NULL) { > - nbdkit_error ("malloc: %m"); > + nbdkit_error ("calloc: %m"); > return NULL; > } > > + h->readonly = readonly; > + pthread_mutex_init (&h->vddk_handles_lock, NULL); > + pthread_cond_init (&h->vddk_handles_cond, NULL); > + > + /* We have to reserve this vector to ensure that it is not > + * reallocated, as that would make the pointer returned by > + * get_vddk_handle in another thread invalid. > + */ > + if (vddk_handles_reserve (&h->vddk_handles, pool_max) == -1) { > + nbdkit_error ("realloc: %m"); > + goto err0; > + } > + > h->params = allocate_connect_params (); > if (h->params == NULL) { > nbdkit_error ("allocate VixDiskLibConnectParams: %m"); > @@ -589,49 +625,120 @@ vddk_open (int readonly) > goto err1; > } > > - flags = 0; > + h->flags = 0; > if (readonly) > - flags |= VIXDISKLIB_FLAG_OPEN_READ_ONLY; > + h->flags |= VIXDISKLIB_FLAG_OPEN_READ_ONLY; > if (single_link) > - flags |= VIXDISKLIB_FLAG_OPEN_SINGLE_LINK; > + h->flags |= VIXDISKLIB_FLAG_OPEN_SINGLE_LINK; > if (unbuffered) > - flags |= VIXDISKLIB_FLAG_OPEN_UNBUFFERED; > - > - DEBUG_CALL ("VixDiskLib_Open", > - "connection, %s, %d, &handle", filename, flags); > - err = VixDiskLib_Open (h->connection, filename, flags, &h->handle); > - if (err != VIX_OK) { > - VDDK_ERROR (err, "VixDiskLib_Open: %s", filename); > - goto err2; > - } > - > - nbdkit_debug ("transport mode: %s", > - VixDiskLib_GetTransportMode (h->handle)); > + h->flags |= VIXDISKLIB_FLAG_OPEN_UNBUFFERED; > > return h; > > - err2: > - DEBUG_CALL ("VixDiskLib_Disconnect", "connection"); > - VixDiskLib_Disconnect (h->connection); > err1: > free_connect_params (h->params); > err0: > + free (h->vddk_handles.ptr); > + pthread_cond_destroy (&h->vddk_handles_cond); > + pthread_mutex_destroy (&h->vddk_handles_lock); > free (h); > return NULL; > } > > +/* Get a VDDK handle on demand. */ > +static VixDiskLibHandle > +open_vddk_handle (struct handle *h) > +{ > + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); > + VixDiskLibHandle vddk_handle; > + VixError err; > + > + DEBUG_CALL ("VixDiskLib_Open", > + "connection, %s, %d, &handle", filename, h->flags); > + err = VixDiskLib_Open (h->connection, filename, h->flags, &vddk_handle); > + if (err != VIX_OK) { > + VDDK_ERROR (err, "VixDiskLib_Open: %s", filename); > + return NULL; > + } > + > + nbdkit_debug ("transport mode: %s", > + VixDiskLib_GetTransportMode (vddk_handle)); > + return vddk_handle; > +} > + > +static struct vddk_handle * > +get_vddk_handle (struct handle *h) > +{ > + const unsigned max = h->readonly ? pool_max : 1; > + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&h->vddk_handles_lock); > + VixDiskLibHandle vddk_handle; > + size_t i; > + > + again: > + /* See if there's a handle in the pool which is not in use. */ > + for (i = 0; i < h->vddk_handles.size; ++i) { > + if (!h->vddk_handles.ptr[i].in_use) { > + h->vddk_handles.ptr[i].in_use = true; > + return &h->vddk_handles.ptr[i]; > + } > + } > + > + /* If the pool is too big we have to wait for another thread to > + * finish using its handle and try again. > + */ > + if (h->vddk_handles.size >= max) { > + pthread_cond_wait (&h->vddk_handles_cond, &h->vddk_handles_lock); > + goto again; > + } > + > + /* Open another handle and add it to the pool. Note that > + * vddk_handles_append cannot fail because we reserved space in > + * vddk_open. > + */ > + vddk_handle = open_vddk_handle (h); > + if (vddk_handle == NULL) > + return NULL; > + vddk_handles_append (&h->vddk_handles, > + (struct vddk_handle){ vddk_handle, true, h }); > + return &h->vddk_handles.ptr[h->vddk_handles.size-1]; > +} > + > +static void > +put_vddk_handle (struct vddk_handle **p) > +{ > + if (*p) { > + ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&(*p)->h->vddk_handles_lock); > + assert ((*p)->in_use); > + (*p)->in_use = false; > + pthread_cond_signal (&(*p)->h->vddk_handles_cond); > + } > +} > + > +/* Wrap get/put_vddk_handle in nicer macro. */ > +#define GET_VDDK_HANDLE_FOR_CURRENT_SCOPE(h, name) \ > + __attribute__((cleanup (put_vddk_handle))) \ > + struct vddk_handle *name##_h = get_vddk_handle (h); \ > + if (name##_h == NULL) return -1; \ > + VixDiskLibHandle name = name##_h->vddk_handle > + > /* Free up the per-connection handle. */ > static void > vddk_close (void *handle) > { > ACQUIRE_LOCK_FOR_CURRENT_SCOPE (&open_close_lock); > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + size_t i; > > - DEBUG_CALL ("VixDiskLib_Close", "handle"); > - VixDiskLib_Close (h->handle); > + for (i = 0; i < h->vddk_handles.size; ++i) { > + DEBUG_CALL ("VixDiskLib_Close", "handle"); > + VixDiskLib_Close (h->vddk_handles.ptr[i].vddk_handle); > + } > + free (h->vddk_handles.ptr); > DEBUG_CALL ("VixDiskLib_Disconnect", "connection"); > VixDiskLib_Disconnect (h->connection); > free_connect_params (h->params); > + pthread_cond_destroy (&h->vddk_handles_cond); > + pthread_mutex_destroy (&h->vddk_handles_lock); > free (h); > } > > @@ -639,13 +746,14 @@ vddk_close (void *handle) > static int64_t > vddk_get_size (void *handle) > { > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); > VixDiskLibInfo *info; > VixError err; > uint64_t size; > > DEBUG_CALL ("VixDiskLib_GetInfo", "handle, &info"); > - err = VixDiskLib_GetInfo (h->handle, &info); > + err = VixDiskLib_GetInfo (vddk_handle, &info); > if (err != VIX_OK) { > VDDK_ERROR (err, "VixDiskLib_GetInfo"); > return -1; > @@ -687,7 +795,8 @@ static int > vddk_pread (void *handle, void *buf, uint32_t count, uint64_t offset, > uint32_t flags) > { > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); > VixError err; > > /* Align to sectors. */ > @@ -706,7 +815,7 @@ vddk_pread (void *handle, void *buf, uint32_t count, > uint64_t offset, > "handle, %" PRIu64 " sectors, " > "%" PRIu32 " sectors, buffer", > offset, count); > - err = VixDiskLib_Read (h->handle, offset, count, buf); > + err = VixDiskLib_Read (vddk_handle, offset, count, buf); > if (err != VIX_OK) { > VDDK_ERROR (err, "VixDiskLib_Read"); > return -1; > @@ -726,7 +835,8 @@ vddk_pwrite (void *handle, const void *buf, uint32_t > count, uint64_t offset, > uint32_t flags) > { > const bool fua = flags & NBDKIT_FLAG_FUA; > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); > VixError err; > > /* Align to sectors. */ > @@ -745,7 +855,7 @@ vddk_pwrite (void *handle, const void *buf, uint32_t > count, uint64_t offset, > "handle, %" PRIu64 " sectors, " > "%" PRIu32 " sectors, buffer", > offset, count); > - err = VixDiskLib_Write (h->handle, offset, count, buf); > + err = VixDiskLib_Write (vddk_handle, offset, count, buf); > if (err != VIX_OK) { > VDDK_ERROR (err, "VixDiskLib_Write"); > return -1; > @@ -761,7 +871,8 @@ vddk_pwrite (void *handle, const void *buf, uint32_t > count, uint64_t offset, > static int > vddk_flush (void *handle, uint32_t flags) > { > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); > VixError err; > > /* The Flush call was not available in VDDK < 6.0 so this is simply > @@ -771,7 +882,7 @@ vddk_flush (void *handle, uint32_t flags) > return 0; > > DEBUG_CALL ("VixDiskLib_Flush", "handle"); > - err = VixDiskLib_Flush (h->handle); > + err = VixDiskLib_Flush (vddk_handle); > if (err != VIX_OK) { > VDDK_ERROR (err, "VixDiskLib_Flush"); > return -1; > @@ -783,7 +894,8 @@ vddk_flush (void *handle, uint32_t flags) > static int > vddk_can_extents (void *handle) > { > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); > VixError err; > VixDiskLibBlockList *block_list; > > @@ -808,7 +920,7 @@ vddk_can_extents (void *handle) > DEBUG_CALL ("VixDiskLib_QueryAllocatedBlocks", > "handle, 0, %d sectors, %d sectors", > VIXDISKLIB_MIN_CHUNK_SIZE, VIXDISKLIB_MIN_CHUNK_SIZE); > - err = VixDiskLib_QueryAllocatedBlocks (h->handle, > + err = VixDiskLib_QueryAllocatedBlocks (vddk_handle, > 0, VIXDISKLIB_MIN_CHUNK_SIZE, > VIXDISKLIB_MIN_CHUNK_SIZE, > &block_list); > @@ -864,7 +976,8 @@ static int > vddk_extents (void *handle, uint32_t count, uint64_t offset, uint32_t > flags, > struct nbdkit_extents *extents) > { > - struct vddk_handle *h = handle; > + struct handle *h = handle; > + GET_VDDK_HANDLE_FOR_CURRENT_SCOPE (h, vddk_handle); > bool req_one = flags & NBDKIT_FLAG_REQ_ONE; > uint64_t position, end, start_sector; > > @@ -896,7 +1009,7 @@ vddk_extents (void *handle, uint32_t count, uint64_t > offset, uint32_t flags, > "handle, %" PRIu64 " sectors, %" PRIu64 " sectors, " > "%d sectors", > start_sector, nr_sectors, VIXDISKLIB_MIN_CHUNK_SIZE); > - err = VixDiskLib_QueryAllocatedBlocks (h->handle, > + err = VixDiskLib_QueryAllocatedBlocks (vddk_handle, > start_sector, nr_sectors, > VIXDISKLIB_MIN_CHUNK_SIZE, > &block_list); > -- > 2.27.0 > >
Apparently Analagous Threads
- [PATCH nbdkit 2/2] vddk: Relax thread model to PARALLEL and implement a disk handle pool.
- [nbdkit PATCH 1/3] vddk: Use a separate handle for single-link=true
- [PATCH nbdkit NOT WORKING 0/2] vddk: Relax threading model.
- [PATCH nbdkit 7/8] vddk: Implement extents.
- [PATCH nbdkit] vddk: Relax threading model and enable multi-conn.