qemu_driver: Don't handle the EOF event if the VM has been restarted

Currently, libvirt creates a thread pool with only one thread to handle all
qemu monitor events for virtual machines. If that thread gets stuck while
handling a monitor EOF event, for example because it is unable to kill the
virtual machine process or release resources, the events of other virtual
machines will also be blocked, which leads to abnormal behavior of
those other virtual machines.

For instance, suppose another virtual machine completes a shutdown operation
and its monitor EOF event has been queued but remains unprocessed. If we
immediately destroy and start that virtual machine again, then at a later
time, when the EOF event gets processed, processMonitorEOFEvent() will kill
the virtual machine that has just been started.

To address this issue, processMonitorEOFEvent() now checks whether
the virtual machine's current id is equal to the one recorded at the time
the event was generated. If they do not match, it returns immediately.

Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Signed-off-by: Guoyi Tu <tugy@chinatelecom.cn>
Signed-off-by: dengpengcheng <dengpc12@chinatelecom.cn>
This commit is contained in:
Guoyi Tu 2023-12-07 20:52:39 +08:00 committed by Daniel P. Berrangé
parent 392897d9b0
commit dd2f36d66e
3 changed files with 11 additions and 4 deletions

View File

@ -11470,7 +11470,6 @@ qemuProcessEventFree(struct qemuProcessEvent *event)
case QEMU_PROCESS_EVENT_NETDEV_STREAM_DISCONNECTED: case QEMU_PROCESS_EVENT_NETDEV_STREAM_DISCONNECTED:
case QEMU_PROCESS_EVENT_NIC_RX_FILTER_CHANGED: case QEMU_PROCESS_EVENT_NIC_RX_FILTER_CHANGED:
case QEMU_PROCESS_EVENT_SERIAL_CHANGED: case QEMU_PROCESS_EVENT_SERIAL_CHANGED:
case QEMU_PROCESS_EVENT_MONITOR_EOF:
case QEMU_PROCESS_EVENT_GUEST_CRASHLOADED: case QEMU_PROCESS_EVENT_GUEST_CRASHLOADED:
g_free(event->data); g_free(event->data);
break; break;
@ -11484,6 +11483,7 @@ qemuProcessEventFree(struct qemuProcessEvent *event)
case QEMU_PROCESS_EVENT_UNATTENDED_MIGRATION: case QEMU_PROCESS_EVENT_UNATTENDED_MIGRATION:
case QEMU_PROCESS_EVENT_RESET: case QEMU_PROCESS_EVENT_RESET:
case QEMU_PROCESS_EVENT_NBDKIT_EXITED: case QEMU_PROCESS_EVENT_NBDKIT_EXITED:
case QEMU_PROCESS_EVENT_MONITOR_EOF:
case QEMU_PROCESS_EVENT_LAST: case QEMU_PROCESS_EVENT_LAST:
break; break;
} }

View File

@ -3854,7 +3854,8 @@ processJobStatusChangeEvent(virDomainObj *vm,
static void static void
processMonitorEOFEvent(virQEMUDriver *driver, processMonitorEOFEvent(virQEMUDriver *driver,
virDomainObj *vm) virDomainObj *vm,
int domid)
{ {
qemuDomainObjPrivate *priv = vm->privateData; qemuDomainObjPrivate *priv = vm->privateData;
int eventReason = VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN; int eventReason = VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN;
@ -3863,6 +3864,12 @@ processMonitorEOFEvent(virQEMUDriver *driver,
unsigned int stopFlags = 0; unsigned int stopFlags = 0;
virObjectEvent *event = NULL; virObjectEvent *event = NULL;
if (vm->def->id != domid) {
VIR_DEBUG("Domain %s was restarted, ignoring EOF",
vm->def->name);
return;
}
if (qemuProcessBeginStopJob(vm, VIR_JOB_DESTROY, true) < 0) if (qemuProcessBeginStopJob(vm, VIR_JOB_DESTROY, true) < 0)
return; return;
@ -4082,7 +4089,7 @@ static void qemuProcessEventHandler(void *data, void *opaque)
processJobStatusChangeEvent(vm, processEvent->data); processJobStatusChangeEvent(vm, processEvent->data);
break; break;
case QEMU_PROCESS_EVENT_MONITOR_EOF: case QEMU_PROCESS_EVENT_MONITOR_EOF:
processMonitorEOFEvent(driver, vm); processMonitorEOFEvent(driver, vm, GPOINTER_TO_INT(processEvent->data));
break; break;
case QEMU_PROCESS_EVENT_PR_DISCONNECT: case QEMU_PROCESS_EVENT_PR_DISCONNECT:
processPRDisconnectEvent(vm); processPRDisconnectEvent(vm);

View File

@ -316,7 +316,7 @@ qemuProcessHandleMonitorEOF(qemuMonitor *mon,
} }
qemuProcessEventSubmit(vm, QEMU_PROCESS_EVENT_MONITOR_EOF, qemuProcessEventSubmit(vm, QEMU_PROCESS_EVENT_MONITOR_EOF,
0, 0, NULL); 0, 0, GINT_TO_POINTER(vm->def->id));
/* We don't want this EOF handler to be called over and over while the /* We don't want this EOF handler to be called over and over while the
* thread is waiting for a job. * thread is waiting for a job.