From b999ce97f391d90ec41ea8426526392de5543fe9 Mon Sep 17 00:00:00 2001 From: Nikolay Shirokovskiy Date: Wed, 20 Jul 2016 18:00:34 +0300 Subject: [PATCH] vz: handle gracefully races on undefining domain The undefine procedure drops the domain lock while waiting for the vz sdk call that detaches disks. Meanwhile the vz sdk event domain-config-changed arrives; its handler finds the domain and blocks waiting for the job condition. After the undefine API call finishes, event processing proceeds and tries to refresh the domain config through the existing vz sdk domain handle. The domain does not exist anymore and event processing fails. Everything is fine; we just don't want to see an error message in the log for this particular case. Fortunately the domain has a flag indicating that it has been removed from the list. This also implies that the vz sdk domain is undefined. Thus if we check this flag right after the domain is locked again on acquiring the job condition, we handle this situation gracefully. Actually the race can happen in other situations too. Any time we wait for the job condition in a mutually exclusive job, the vz sdk domain can cease to exist by the time we acquire it. So instead of a general internal error we can return domain not found, which is easier to handle. We don't need to patch other places in mutually exclusive jobs where the domain lock is dropped, because once a job is started the domain can't be undefined by the mutually exclusive undefine job. The code of this patch is quite similar to the qemu driver's checks for whether the domain is active after acquiring a job. The only difference is that a qemu domain is operational while its process is active, whereas a vz domain is operational while the domain exists. 
--- src/vz/vz_driver.c | 49 ++++++++++++++++++++++++++++++++++++++++++++++ src/vz/vz_sdk.c | 13 ++++++++++++ 2 files changed, 62 insertions(+) diff --git a/src/vz/vz_driver.c b/src/vz/vz_driver.c index ce43d1b963..343145510a 100644 --- a/src/vz/vz_driver.c +++ b/src/vz/vz_driver.c @@ -714,6 +714,22 @@ vzDomainGetAutostart(virDomainPtr domain, int *autostart) return 0; } +static int +vzEnsureDomainExists(virDomainObjPtr dom) +{ + char uuidstr[VIR_UUID_STRING_BUFLEN]; + + if (!dom->removing) + return 0; + + virUUIDFormat(dom->def->uuid, uuidstr); + virReportError(VIR_ERR_NO_DOMAIN, + _("no domain with matching uuid '%s' (%s)"), + uuidstr, dom->def->name); + + return -1; +} + static virDomainPtr vzDomainDefineXMLFlags(virConnectPtr conn, const char *xml, unsigned int flags) { @@ -780,6 +796,9 @@ vzDomainDefineXMLFlags(virConnectPtr conn, const char *xml, unsigned int flags) goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + if (prlsdkApplyConfig(driver, dom, def)) goto cleanup; @@ -1010,6 +1029,9 @@ vzDomainUndefineFlags(virDomainPtr domain, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + ret = prlsdkUnregisterDomain(privconn->driver, dom, flags); cleanup: @@ -1066,6 +1088,9 @@ vzDomainManagedSave(virDomainPtr domain, unsigned int flags) goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + state = virDomainObjGetState(dom, &reason); if (state == VIR_DOMAIN_RUNNING && (flags & VIR_DOMAIN_SAVE_PAUSED)) { @@ -1157,6 +1182,9 @@ static int vzDomainAttachDeviceFlags(virDomainPtr domain, const char *xml, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + if (prlsdkAttachDevice(driver, dom, dev) < 0) goto cleanup; @@ -1206,6 +1234,9 @@ static int vzDomainDetachDeviceFlags(virDomainPtr domain, const char *xml, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + if (prlsdkDetachDevice(driver, dom, dev) < 0) goto cleanup; @@ 
-1243,6 +1274,9 @@ vzDomainSetUserPassword(virDomainPtr domain, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + ret = prlsdkDomainSetUserPassword(dom, user, password); cleanup: @@ -1281,6 +1315,9 @@ static int vzDomainUpdateDeviceFlags(virDomainPtr domain, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + if (prlsdkUpdateDevice(driver, dom, dev) < 0) goto cleanup; @@ -1619,6 +1656,9 @@ static int vzDomainSetMemoryFlagsImpl(virDomainPtr domain, unsigned long memory, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + ret = prlsdkSetMemsize(dom, memory >> 10); cleanup: @@ -2103,6 +2143,9 @@ vzDomainSnapshotCreateXML(virDomainPtr domain, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + /* snaphot name is ignored, it will be set to auto generated by sdk uuid */ if (prlsdkCreateSnapshot(dom, def->description) < 0) goto cleanup; @@ -2164,6 +2207,9 @@ vzDomainRevertToSnapshot(virDomainSnapshotPtr snapshot, unsigned int flags) goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + ret = prlsdkSwitchToSnapshot(dom, snapshot->name, flags & VIR_DOMAIN_SNAPSHOT_REVERT_PAUSED); cleanup: @@ -2534,6 +2580,9 @@ vzDomainMigratePerformStep(virDomainPtr domain, goto cleanup; job = true; + if (vzEnsureDomainExists(dom) < 0) + goto cleanup; + if (!(vzuri = vzParseVzURI(miguri))) goto cleanup; diff --git a/src/vz/vz_sdk.c b/src/vz/vz_sdk.c index 5c2a6c5961..38254c05e2 100644 --- a/src/vz/vz_sdk.c +++ b/src/vz/vz_sdk.c @@ -2067,6 +2067,9 @@ prlsdkHandleVmConfigEvent(vzDriverPtr driver, goto cleanup; job = true; + if (dom->removing) + goto cleanup; + if (prlsdkUpdateDomain(driver, dom) < 0) goto cleanup; @@ -2333,6 +2336,16 @@ prlsdkDomainChangeState(virDomainPtr domain, goto cleanup; job = true; + if (dom->removing) { + char uuidstr[VIR_UUID_STRING_BUFLEN]; + + virUUIDFormat(dom->def->uuid, uuidstr); + virReportError(VIR_ERR_NO_DOMAIN, + 
_("no domain with matching uuid '%s' (%s)"), + uuidstr, dom->def->name); + goto cleanup; + } + ret = prlsdkDomainChangeStateLocked(privconn->driver, dom, chstate); cleanup: