[libvirt] [PATCH v2 5/5] vz: handle gracefully races on undefining domain

Nikolay Shirokovskiy nshirokovskiy at virtuozzo.com
Wed Jul 20 15:00:34 UTC 2016


  This patch is not critical but nice to have. The original motivation
was an error message in the logs on undefining a domain through the vz
driver. The undefine procedure drops the domain lock while waiting for
the vz sdk call that detaches disks. Meanwhile the vz sdk event
domain-config-changed arrives; its handler finds the domain and is
blocked waiting for the job condition. After the undefine API call
finishes, event processing proceeds and tries to refresh the domain
config through the existing vz sdk domain handle. The domain does not
exist anymore and event processing fails. Everything is fine; we just
don't want to see an error message in the log for this particular case.

  Fortunately the domain has a flag indicating that it has been removed
from the list. This also implies that the vz sdk domain is undefined
too. Thus if we check for this flag right after the domain is locked
again on acquiring the job condition, we handle this situation gracefully.

  Actually the race can happen in other situations too. Any
time we wait for the job condition in a mutually exclusive job, the
vz sdk domain can cease to exist by the time we acquire it.
So instead of a general internal error we can return domain
not found, which is easier to handle. We don't need to patch
other places in mutually exclusive jobs where the domain lock
is dropped, because once a job is started the domain can't be
undefined by the mutually exclusive undefine job.

  The code of this patch is quite similar to the qemu driver checks
for whether the domain is active after acquiring a job. The only
difference is that a qemu domain is operational while its process is
active, whereas a vz domain is operational while the domain exists.
---
 src/vz/vz_driver.c | 49 +++++++++++++++++++++++++++++++++++++++++++++++++
 src/vz/vz_sdk.c    | 13 +++++++++++++
 2 files changed, 62 insertions(+)

diff --git a/src/vz/vz_driver.c b/src/vz/vz_driver.c
index ce43d1b..3431455 100644
--- a/src/vz/vz_driver.c
+++ b/src/vz/vz_driver.c
@@ -714,6 +714,22 @@ vzDomainGetAutostart(virDomainPtr domain, int *autostart)
     return 0;
 }
 
+static int
+vzEnsureDomainExists(virDomainObjPtr dom)
+{
+    char uuidstr[VIR_UUID_STRING_BUFLEN];
+
+    if (!dom->removing)
+        return 0;
+
+    virUUIDFormat(dom->def->uuid, uuidstr);
+    virReportError(VIR_ERR_NO_DOMAIN,
+                   _("no domain with matching uuid '%s' (%s)"),
+                   uuidstr, dom->def->name);
+
+    return -1;
+}
+
 static virDomainPtr
 vzDomainDefineXMLFlags(virConnectPtr conn, const char *xml, unsigned int flags)
 {
@@ -780,6 +796,9 @@ vzDomainDefineXMLFlags(virConnectPtr conn, const char *xml, unsigned int flags)
                 goto cleanup;
             job = true;
 
+            if (vzEnsureDomainExists(dom) < 0)
+                goto cleanup;
+
             if (prlsdkApplyConfig(driver, dom, def))
                 goto cleanup;
 
@@ -1010,6 +1029,9 @@ vzDomainUndefineFlags(virDomainPtr domain,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     ret = prlsdkUnregisterDomain(privconn->driver, dom, flags);
 
  cleanup:
@@ -1066,6 +1088,9 @@ vzDomainManagedSave(virDomainPtr domain, unsigned int flags)
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     state = virDomainObjGetState(dom, &reason);
 
     if (state == VIR_DOMAIN_RUNNING && (flags & VIR_DOMAIN_SAVE_PAUSED)) {
@@ -1157,6 +1182,9 @@ static int vzDomainAttachDeviceFlags(virDomainPtr domain, const char *xml,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     if (prlsdkAttachDevice(driver, dom, dev) < 0)
         goto cleanup;
 
@@ -1206,6 +1234,9 @@ static int vzDomainDetachDeviceFlags(virDomainPtr domain, const char *xml,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     if (prlsdkDetachDevice(driver, dom, dev) < 0)
         goto cleanup;
 
@@ -1243,6 +1274,9 @@ vzDomainSetUserPassword(virDomainPtr domain,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     ret = prlsdkDomainSetUserPassword(dom, user, password);
 
  cleanup:
@@ -1281,6 +1315,9 @@ static int vzDomainUpdateDeviceFlags(virDomainPtr domain,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     if (prlsdkUpdateDevice(driver, dom, dev) < 0)
         goto cleanup;
 
@@ -1619,6 +1656,9 @@ static int vzDomainSetMemoryFlagsImpl(virDomainPtr domain, unsigned long memory,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     ret = prlsdkSetMemsize(dom, memory >> 10);
 
  cleanup:
@@ -2103,6 +2143,9 @@ vzDomainSnapshotCreateXML(virDomainPtr domain,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     /* snaphot name is ignored, it will be set to auto generated by sdk uuid */
     if (prlsdkCreateSnapshot(dom, def->description) < 0)
         goto cleanup;
@@ -2164,6 +2207,9 @@ vzDomainRevertToSnapshot(virDomainSnapshotPtr snapshot, unsigned int flags)
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     ret = prlsdkSwitchToSnapshot(dom, snapshot->name,
                                  flags & VIR_DOMAIN_SNAPSHOT_REVERT_PAUSED);
  cleanup:
@@ -2534,6 +2580,9 @@ vzDomainMigratePerformStep(virDomainPtr domain,
         goto cleanup;
     job = true;
 
+    if (vzEnsureDomainExists(dom) < 0)
+        goto cleanup;
+
     if (!(vzuri = vzParseVzURI(miguri)))
         goto cleanup;
 
diff --git a/src/vz/vz_sdk.c b/src/vz/vz_sdk.c
index 5c2a6c5..38254c0 100644
--- a/src/vz/vz_sdk.c
+++ b/src/vz/vz_sdk.c
@@ -2067,6 +2067,9 @@ prlsdkHandleVmConfigEvent(vzDriverPtr driver,
         goto cleanup;
     job = true;
 
+    if (dom->removing)
+        goto cleanup;
+
     if (prlsdkUpdateDomain(driver, dom) < 0)
         goto cleanup;
 
@@ -2333,6 +2336,16 @@ prlsdkDomainChangeState(virDomainPtr domain,
         goto cleanup;
     job = true;
 
+    if (dom->removing) {
+        char uuidstr[VIR_UUID_STRING_BUFLEN];
+
+        virUUIDFormat(dom->def->uuid, uuidstr);
+        virReportError(VIR_ERR_NO_DOMAIN,
+                       _("no domain with matching uuid '%s' (%s)"),
+                       uuidstr, dom->def->name);
+        goto cleanup;
+    }
+
     ret = prlsdkDomainChangeStateLocked(privconn->driver, dom, chstate);
 
  cleanup:
-- 
1.8.3.1




More information about the libvir-list mailing list