 c265e976f4
			
		
	
	
		c265e976f4
		
	
	
	
	
		
			
			Set cpu->running without taking the cpu_list lock, only requiring it if there is a concurrent exclusive section. This requires adding a new field to CPUState, which records whether a running CPU is being counted in pending_cpus. When an exclusive section is started concurrently with cpu_exec_start, cpu_exec_start can use the new field to determine if it has to wait for the end of the exclusive section. Likewise, cpu_exec_end can use it to see if start_exclusive is waiting for that CPU. This a separate patch for easier bisection of issues. Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
		
			
				
	
	
		
			353 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			353 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * CPU thread main loop - common bits for user and system mode emulation
 | |
|  *
 | |
|  *  Copyright (c) 2003-2005 Fabrice Bellard
 | |
|  *
 | |
|  * This library is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * This library is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 | |
|  */
 | |
| 
 | |
| #include "qemu/osdep.h"
 | |
| #include "qemu/main-loop.h"
 | |
| #include "exec/cpu-common.h"
 | |
| #include "qom/cpu.h"
 | |
| #include "sysemu/cpus.h"
 | |
| 
 | |
| static QemuMutex qemu_cpu_list_lock;
 | |
| static QemuCond exclusive_cond;
 | |
| static QemuCond exclusive_resume;
 | |
| static QemuCond qemu_work_cond;
 | |
| 
 | |
| /* >= 1 if a thread is inside start_exclusive/end_exclusive.  Written
 | |
|  * under qemu_cpu_list_lock, read with atomic operations.
 | |
|  */
 | |
| static int pending_cpus;
 | |
| 
 | |
| void qemu_init_cpu_list(void)
 | |
| {
 | |
|     /* This is needed because qemu_init_cpu_list is also called by the
 | |
|      * child process in a fork.  */
 | |
|     pending_cpus = 0;
 | |
| 
 | |
|     qemu_mutex_init(&qemu_cpu_list_lock);
 | |
|     qemu_cond_init(&exclusive_cond);
 | |
|     qemu_cond_init(&exclusive_resume);
 | |
|     qemu_cond_init(&qemu_work_cond);
 | |
| }
 | |
| 
 | |
| void cpu_list_lock(void)
 | |
| {
 | |
|     qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
| }
 | |
| 
 | |
| void cpu_list_unlock(void)
 | |
| {
 | |
|     qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
| }
 | |
| 
 | |
| static bool cpu_index_auto_assigned;
 | |
| 
 | |
| static int cpu_get_free_index(void)
 | |
| {
 | |
|     CPUState *some_cpu;
 | |
|     int cpu_index = 0;
 | |
| 
 | |
|     cpu_index_auto_assigned = true;
 | |
|     CPU_FOREACH(some_cpu) {
 | |
|         cpu_index++;
 | |
|     }
 | |
|     return cpu_index;
 | |
| }
 | |
| 
 | |
| static void finish_safe_work(CPUState *cpu)
 | |
| {
 | |
|     cpu_exec_start(cpu);
 | |
|     cpu_exec_end(cpu);
 | |
| }
 | |
| 
 | |
| void cpu_list_add(CPUState *cpu)
 | |
| {
 | |
|     qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
|     if (cpu->cpu_index == UNASSIGNED_CPU_INDEX) {
 | |
|         cpu->cpu_index = cpu_get_free_index();
 | |
|         assert(cpu->cpu_index != UNASSIGNED_CPU_INDEX);
 | |
|     } else {
 | |
|         assert(!cpu_index_auto_assigned);
 | |
|     }
 | |
|     QTAILQ_INSERT_TAIL(&cpus, cpu, node);
 | |
|     qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
| 
 | |
|     finish_safe_work(cpu);
 | |
| }
 | |
| 
 | |
| void cpu_list_remove(CPUState *cpu)
 | |
| {
 | |
|     qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
|     if (!QTAILQ_IN_USE(cpu, node)) {
 | |
|         /* there is nothing to undo since cpu_exec_init() hasn't been called */
 | |
|         qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     assert(!(cpu_index_auto_assigned && cpu != QTAILQ_LAST(&cpus, CPUTailQ)));
 | |
| 
 | |
|     QTAILQ_REMOVE(&cpus, cpu, node);
 | |
|     cpu->cpu_index = UNASSIGNED_CPU_INDEX;
 | |
|     qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
| }
 | |
| 
 | |
| struct qemu_work_item {
 | |
|     struct qemu_work_item *next;
 | |
|     run_on_cpu_func func;
 | |
|     void *data;
 | |
|     bool free, exclusive, done;
 | |
| };
 | |
| 
 | |
| static void queue_work_on_cpu(CPUState *cpu, struct qemu_work_item *wi)
 | |
| {
 | |
|     qemu_mutex_lock(&cpu->work_mutex);
 | |
|     if (cpu->queued_work_first == NULL) {
 | |
|         cpu->queued_work_first = wi;
 | |
|     } else {
 | |
|         cpu->queued_work_last->next = wi;
 | |
|     }
 | |
|     cpu->queued_work_last = wi;
 | |
|     wi->next = NULL;
 | |
|     wi->done = false;
 | |
|     qemu_mutex_unlock(&cpu->work_mutex);
 | |
| 
 | |
|     qemu_cpu_kick(cpu);
 | |
| }
 | |
| 
 | |
| void do_run_on_cpu(CPUState *cpu, run_on_cpu_func func, void *data,
 | |
|                    QemuMutex *mutex)
 | |
| {
 | |
|     struct qemu_work_item wi;
 | |
| 
 | |
|     if (qemu_cpu_is_self(cpu)) {
 | |
|         func(cpu, data);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     wi.func = func;
 | |
|     wi.data = data;
 | |
|     wi.done = false;
 | |
|     wi.free = false;
 | |
|     wi.exclusive = false;
 | |
| 
 | |
|     queue_work_on_cpu(cpu, &wi);
 | |
|     while (!atomic_mb_read(&wi.done)) {
 | |
|         CPUState *self_cpu = current_cpu;
 | |
| 
 | |
|         qemu_cond_wait(&qemu_work_cond, mutex);
 | |
|         current_cpu = self_cpu;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void async_run_on_cpu(CPUState *cpu, run_on_cpu_func func, void *data)
 | |
| {
 | |
|     struct qemu_work_item *wi;
 | |
| 
 | |
|     wi = g_malloc0(sizeof(struct qemu_work_item));
 | |
|     wi->func = func;
 | |
|     wi->data = data;
 | |
|     wi->free = true;
 | |
| 
 | |
|     queue_work_on_cpu(cpu, wi);
 | |
| }
 | |
| 
 | |
| /* Wait for pending exclusive operations to complete.  The CPU list lock
 | |
|    must be held.  */
 | |
| static inline void exclusive_idle(void)
 | |
| {
 | |
|     while (pending_cpus) {
 | |
|         qemu_cond_wait(&exclusive_resume, &qemu_cpu_list_lock);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /* Start an exclusive operation.
 | |
|    Must only be called from outside cpu_exec.  */
 | |
| void start_exclusive(void)
 | |
| {
 | |
|     CPUState *other_cpu;
 | |
|     int running_cpus;
 | |
| 
 | |
|     qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
|     exclusive_idle();
 | |
| 
 | |
|     /* Make all other cpus stop executing.  */
 | |
|     atomic_set(&pending_cpus, 1);
 | |
| 
 | |
|     /* Write pending_cpus before reading other_cpu->running.  */
 | |
|     smp_mb();
 | |
|     running_cpus = 0;
 | |
|     CPU_FOREACH(other_cpu) {
 | |
|         if (atomic_read(&other_cpu->running)) {
 | |
|             other_cpu->has_waiter = true;
 | |
|             running_cpus++;
 | |
|             qemu_cpu_kick(other_cpu);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     atomic_set(&pending_cpus, running_cpus + 1);
 | |
|     while (pending_cpus > 1) {
 | |
|         qemu_cond_wait(&exclusive_cond, &qemu_cpu_list_lock);
 | |
|     }
 | |
| 
 | |
|     /* Can release mutex, no one will enter another exclusive
 | |
|      * section until end_exclusive resets pending_cpus to 0.
 | |
|      */
 | |
|     qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
| }
 | |
| 
 | |
| /* Finish an exclusive operation.  */
 | |
| void end_exclusive(void)
 | |
| {
 | |
|     qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
|     atomic_set(&pending_cpus, 0);
 | |
|     qemu_cond_broadcast(&exclusive_resume);
 | |
|     qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
| }
 | |
| 
 | |
| /* Wait for exclusive ops to finish, and begin cpu execution.  */
 | |
| void cpu_exec_start(CPUState *cpu)
 | |
| {
 | |
|     atomic_set(&cpu->running, true);
 | |
| 
 | |
|     /* Write cpu->running before reading pending_cpus.  */
 | |
|     smp_mb();
 | |
| 
 | |
|     /* 1. start_exclusive saw cpu->running == true and pending_cpus >= 1.
 | |
|      * After taking the lock we'll see cpu->has_waiter == true and run---not
 | |
|      * for long because start_exclusive kicked us.  cpu_exec_end will
 | |
|      * decrement pending_cpus and signal the waiter.
 | |
|      *
 | |
|      * 2. start_exclusive saw cpu->running == false but pending_cpus >= 1.
 | |
|      * This includes the case when an exclusive item is running now.
 | |
|      * Then we'll see cpu->has_waiter == false and wait for the item to
 | |
|      * complete.
 | |
|      *
 | |
|      * 3. pending_cpus == 0.  Then start_exclusive is definitely going to
 | |
|      * see cpu->running == true, and it will kick the CPU.
 | |
|      */
 | |
|     if (unlikely(atomic_read(&pending_cpus))) {
 | |
|         qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
|         if (!cpu->has_waiter) {
 | |
|             /* Not counted in pending_cpus, let the exclusive item
 | |
|              * run.  Since we have the lock, just set cpu->running to true
 | |
|              * while holding it; no need to check pending_cpus again.
 | |
|              */
 | |
|             atomic_set(&cpu->running, false);
 | |
|             exclusive_idle();
 | |
|             /* Now pending_cpus is zero.  */
 | |
|             atomic_set(&cpu->running, true);
 | |
|         } else {
 | |
|             /* Counted in pending_cpus, go ahead and release the
 | |
|              * waiter at cpu_exec_end.
 | |
|              */
 | |
|         }
 | |
|         qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /* Mark cpu as not executing, and release pending exclusive ops.  */
 | |
| void cpu_exec_end(CPUState *cpu)
 | |
| {
 | |
|     atomic_set(&cpu->running, false);
 | |
| 
 | |
|     /* Write cpu->running before reading pending_cpus.  */
 | |
|     smp_mb();
 | |
| 
 | |
|     /* 1. start_exclusive saw cpu->running == true.  Then it will increment
 | |
|      * pending_cpus and wait for exclusive_cond.  After taking the lock
 | |
|      * we'll see cpu->has_waiter == true.
 | |
|      *
 | |
|      * 2. start_exclusive saw cpu->running == false but here pending_cpus >= 1.
 | |
|      * This includes the case when an exclusive item started after setting
 | |
|      * cpu->running to false and before we read pending_cpus.  Then we'll see
 | |
|      * cpu->has_waiter == false and not touch pending_cpus.  The next call to
 | |
|      * cpu_exec_start will run exclusive_idle if still necessary, thus waiting
 | |
|      * for the item to complete.
 | |
|      *
 | |
|      * 3. pending_cpus == 0.  Then start_exclusive is definitely going to
 | |
|      * see cpu->running == false, and it can ignore this CPU until the
 | |
|      * next cpu_exec_start.
 | |
|      */
 | |
|     if (unlikely(atomic_read(&pending_cpus))) {
 | |
|         qemu_mutex_lock(&qemu_cpu_list_lock);
 | |
|         if (cpu->has_waiter) {
 | |
|             cpu->has_waiter = false;
 | |
|             atomic_set(&pending_cpus, pending_cpus - 1);
 | |
|             if (pending_cpus == 1) {
 | |
|                 qemu_cond_signal(&exclusive_cond);
 | |
|             }
 | |
|         }
 | |
|         qemu_mutex_unlock(&qemu_cpu_list_lock);
 | |
|     }
 | |
| }
 | |
| 
 | |
| void async_safe_run_on_cpu(CPUState *cpu, run_on_cpu_func func, void *data)
 | |
| {
 | |
|     struct qemu_work_item *wi;
 | |
| 
 | |
|     wi = g_malloc0(sizeof(struct qemu_work_item));
 | |
|     wi->func = func;
 | |
|     wi->data = data;
 | |
|     wi->free = true;
 | |
|     wi->exclusive = true;
 | |
| 
 | |
|     queue_work_on_cpu(cpu, wi);
 | |
| }
 | |
| 
 | |
| void process_queued_cpu_work(CPUState *cpu)
 | |
| {
 | |
|     struct qemu_work_item *wi;
 | |
| 
 | |
|     if (cpu->queued_work_first == NULL) {
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     qemu_mutex_lock(&cpu->work_mutex);
 | |
|     while (cpu->queued_work_first != NULL) {
 | |
|         wi = cpu->queued_work_first;
 | |
|         cpu->queued_work_first = wi->next;
 | |
|         if (!cpu->queued_work_first) {
 | |
|             cpu->queued_work_last = NULL;
 | |
|         }
 | |
|         qemu_mutex_unlock(&cpu->work_mutex);
 | |
|         if (wi->exclusive) {
 | |
|             /* Running work items outside the BQL avoids the following deadlock:
 | |
|              * 1) start_exclusive() is called with the BQL taken while another
 | |
|              * CPU is running; 2) cpu_exec in the other CPU tries to takes the
 | |
|              * BQL, so it goes to sleep; start_exclusive() is sleeping too, so
 | |
|              * neither CPU can proceed.
 | |
|              */
 | |
|             qemu_mutex_unlock_iothread();
 | |
|             start_exclusive();
 | |
|             wi->func(cpu, wi->data);
 | |
|             end_exclusive();
 | |
|             qemu_mutex_lock_iothread();
 | |
|         } else {
 | |
|             wi->func(cpu, wi->data);
 | |
|         }
 | |
|         qemu_mutex_lock(&cpu->work_mutex);
 | |
|         if (wi->free) {
 | |
|             g_free(wi);
 | |
|         } else {
 | |
|             atomic_mb_set(&wi->done, true);
 | |
|         }
 | |
|     }
 | |
|     qemu_mutex_unlock(&cpu->work_mutex);
 | |
|     qemu_cond_broadcast(&qemu_work_cond);
 | |
| }
 |