Blame - src/api.c - hafnium/hafnium.git - TrustedFirmware Git Browser

blob: 90dac1949da19a7f458c6762891af15fd8665676 [file] [log] [blame]

Andrew Scull	1883487	2018-10-12 11:48:09 +0100	[diff] [blame]	1	/*
Andrew Walbran	692b325	2019-03-07 15:51:31 +0000	[diff] [blame]	2	* Copyright 2018 The Hafnium Authors.
Andrew Scull	1883487	2018-10-12 11:48:09 +0100	[diff] [blame]	3	*
				4	* Licensed under the Apache License, Version 2.0 (the "License");
				5	* you may not use this file except in compliance with the License.
				6	* You may obtain a copy of the License at
				7	*
				8	* https://www.apache.org/licenses/LICENSE-2.0
				9	*
				10	* Unless required by applicable law or agreed to in writing, software
				11	* distributed under the License is distributed on an "AS IS" BASIS,
				12	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
				13	* See the License for the specific language governing permissions and
				14	* limitations under the License.
				15	*/
				16
Andrew Scull	18c78fc	2018-08-20 12:57:41 +0100	[diff] [blame]	17	#include "hf/api.h"
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	18
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	19	#include "hf/arch/cpu.h"
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	20	#include "hf/arch/timer.h"
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	21
Andrew Scull	877ae4b	2019-07-02 12:52:33 +0100	[diff] [blame]	22	#include "hf/check.h"
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	23	#include "hf/dlog.h"
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	24	#include "hf/mm.h"
Andrew Walbran	b037d5b	2019-06-25 17:19:41 +0100	[diff] [blame]	25	#include "hf/spci.h"
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	26	#include "hf/spinlock.h"
Andrew Scull	877ae4b	2019-07-02 12:52:33 +0100	[diff] [blame]	27	#include "hf/static_assert.h"
Andrew Scull	8d9e121	2019-04-05 13:52:55 +0100	[diff] [blame]	28	#include "hf/std.h"
Andrew Scull	18c78fc	2018-08-20 12:57:41 +0100	[diff] [blame]	29	#include "hf/vm.h"
				30
Andrew Scull	f35a5c9	2018-08-07 18:09:46 +0100	[diff] [blame]	31	#include "vmapi/hf/call.h"
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	32	#include "vmapi/hf/spci.h"
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	33
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	34	/*
				35	* To eliminate the risk of deadlocks, we define a partial order for the
				36	* acquisition of locks held concurrently by the same physical CPU. Our current
				37	* ordering requirements are as follows:
				38	*
Andrew Scull	ba79b0a	2019-07-03 11:26:53 +0100	[diff] [blame]	39	* vm::lock -> vcpu::lock -> mm_stage1_lock
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	40	*
Andrew Scull	4caadaf	2019-07-03 13:13:47 +0100	[diff] [blame]	41	* Locks of the same kind require the lock of lowest address to be locked first,
				42	* see `sl_lock_both()`.
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	43	*/
				44
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	45	static_assert(HF_MAILBOX_SIZE == PAGE_SIZE,
Andrew Scull	13652af	2018-09-17 14:49:08 +0100	[diff] [blame]	46	"Currently, a page is mapped for the send and receive buffers so "
				47	"the maximum request is the size of a page.");
				48
Wedson Almeida Filho	9ed8da5	2018-12-17 16:09:11 +0000	[diff] [blame]	49	static struct mpool api_page_pool;
Wedson Almeida Filho	22d5eaa	2018-12-16 00:38:49 +0000	[diff] [blame]	50
				51	/**
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	52	* Initialises the API page pool by taking ownership of the contents of the
				53	* given page pool.
Wedson Almeida Filho	22d5eaa	2018-12-16 00:38:49 +0000	[diff] [blame]	54	*/
				55	void api_init(struct mpool *ppool)
				56	{
Wedson Almeida Filho	9ed8da5	2018-12-17 16:09:11 +0000	[diff] [blame]	57	mpool_init_from(&api_page_pool, ppool);
Wedson Almeida Filho	22d5eaa	2018-12-16 00:38:49 +0000	[diff] [blame]	58	}
				59
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	60	/**
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	61	* Switches the physical CPU back to the corresponding vcpu of the primary VM.
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	62	*
				63	* This triggers the scheduling logic to run. Run in the context of secondary VM
				64	* to cause HF_VCPU_RUN to return and the primary VM to regain control of the
				65	* cpu.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	66	*/
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	67	static struct vcpu api_switch_to_primary(struct vcpu current,
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	68	struct hf_vcpu_run_return primary_ret,
				69	enum vcpu_state secondary_state)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	70	{
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	71	struct vm *primary = vm_find(HF_PRIMARY_VM_ID);
Andrew Walbran	e1310df	2019-04-29 17:28:28 +0100	[diff] [blame]	72	struct vcpu *next = vm_get_vcpu(primary, cpu_index(current->cpu));
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	73
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	74	/*
				75	* If the secondary is blocked but has a timer running, sleep until the
				76	* timer fires rather than indefinitely.
				77	*/
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	78	switch (primary_ret.code) {
				79	case HF_VCPU_RUN_WAIT_FOR_INTERRUPT:
				80	case HF_VCPU_RUN_WAIT_FOR_MESSAGE:
				81	primary_ret.sleep.ns =
				82	arch_timer_enabled_current()
				83	? arch_timer_remaining_ns_current()
				84	: HF_SLEEP_INDEFINITE;
				85	break;
				86
				87	default:
				88	/* Do nothing. */
				89	break;
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	90	}
				91
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	92	/* Set the return value for the primary VM's call to HF_VCPU_RUN. */
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	93	arch_regs_set_retval(&next->regs,
				94	hf_vcpu_run_return_encode(primary_ret));
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	95
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	96	/* Mark the current vcpu as waiting. */
				97	sl_lock(&current->lock);
				98	current->state = secondary_state;
				99	sl_unlock(&current->lock);
				100
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	101	return next;
				102	}
				103
				104	/**
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	105	* Returns to the primary vm and signals that the vcpu still has work to do so.
				106	*/
				107	struct vcpu api_preempt(struct vcpu current)
				108	{
				109	struct hf_vcpu_run_return ret = {
				110	.code = HF_VCPU_RUN_PREEMPTED,
				111	};
				112
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	113	return api_switch_to_primary(current, ret, VCPU_STATE_READY);
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	114	}
				115
				116	/**
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	117	* Puts the current vcpu in wait for interrupt mode, and returns to the primary
				118	* vm.
				119	*/
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	120	struct vcpu api_wait_for_interrupt(struct vcpu current)
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	121	{
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	122	struct hf_vcpu_run_return ret = {
				123	.code = HF_VCPU_RUN_WAIT_FOR_INTERRUPT,
				124	};
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	125
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	126	return api_switch_to_primary(current, ret,
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	127	VCPU_STATE_BLOCKED_INTERRUPT);
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	128	}
				129
				130	/**
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	131	* Puts the current vCPU in off mode, and returns to the primary VM.
				132	*/
				133	struct vcpu api_vcpu_off(struct vcpu current)
				134	{
				135	struct hf_vcpu_run_return ret = {
				136	.code = HF_VCPU_RUN_WAIT_FOR_INTERRUPT,
				137	};
				138
				139	/*
				140	* Disable the timer, so the scheduler doesn't get told to call back
				141	* based on it.
				142	*/
				143	arch_timer_disable_current();
				144
				145	return api_switch_to_primary(current, ret, VCPU_STATE_OFF);
				146	}
				147
				148	/**
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	149	* Returns to the primary vm to allow this cpu to be used for other tasks as the
				150	* vcpu does not have work to do at this moment. The current vcpu is marked as
Jose Marinho	135dff3	2019-02-28 10:25:57 +0000	[diff] [blame]	151	* ready to be scheduled again. This SPCI function always returns SPCI_SUCCESS.
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	152	*/
Jose Marinho	135dff3	2019-02-28 10:25:57 +0000	[diff] [blame]	153	int32_t api_spci_yield(struct vcpu current, struct vcpu *next)
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	154	{
				155	struct hf_vcpu_run_return ret = {
				156	.code = HF_VCPU_RUN_YIELD,
				157	};
				158
				159	if (current->vm->id == HF_PRIMARY_VM_ID) {
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	160	/* Noop on the primary as it makes the scheduling decisions. */
Jose Marinho	135dff3	2019-02-28 10:25:57 +0000	[diff] [blame]	161	return SPCI_SUCCESS;
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	162	}
				163
Jose Marinho	135dff3	2019-02-28 10:25:57 +0000	[diff] [blame]	164	*next = api_switch_to_primary(current, ret, VCPU_STATE_READY);
				165
				166	/* SPCI_YIELD always returns SPCI_SUCCESS. */
				167	return SPCI_SUCCESS;
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	168	}
				169
				170	/**
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	171	* Switches to the primary so that it can switch to the target, or kick it if it
				172	* is already running on a different physical CPU.
				173	*/
				174	struct vcpu api_wake_up(struct vcpu current, struct vcpu *target_vcpu)
				175	{
				176	struct hf_vcpu_run_return ret = {
				177	.code = HF_VCPU_RUN_WAKE_UP,
				178	.wake_up.vm_id = target_vcpu->vm->id,
				179	.wake_up.vcpu = vcpu_index(target_vcpu),
				180	};
				181	return api_switch_to_primary(current, ret, VCPU_STATE_READY);
				182	}
				183
				184	/**
Andrew Scull	38772ab	2019-01-24 15:16:50 +0000	[diff] [blame]	185	* Aborts the vCPU and triggers its VM to abort fully.
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	186	*/
				187	struct vcpu api_abort(struct vcpu current)
				188	{
				189	struct hf_vcpu_run_return ret = {
				190	.code = HF_VCPU_RUN_ABORTED,
				191	};
				192
				193	dlog("Aborting VM %u vCPU %u\n", current->vm->id, vcpu_index(current));
				194
				195	if (current->vm->id == HF_PRIMARY_VM_ID) {
				196	/* TODO: what to do when the primary aborts? */
				197	for (;;) {
				198	/* Do nothing. */
				199	}
				200	}
				201
				202	atomic_store_explicit(&current->vm->aborting, true,
				203	memory_order_relaxed);
				204
				205	/* TODO: free resources once all vCPUs abort. */
				206
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	207	return api_switch_to_primary(current, ret, VCPU_STATE_ABORTED);
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	208	}
				209
				210	/**
Andrew Scull	55c4d8b	2018-12-18 18:50:18 +0000	[diff] [blame]	211	* Returns the ID of the VM.
				212	*/
Andrew Walbran	fc6cd9d	2019-06-25 15:23:27 +0100	[diff] [blame]	213	spci_vm_id_t api_vm_get_id(const struct vcpu *current)
Andrew Scull	55c4d8b	2018-12-18 18:50:18 +0000	[diff] [blame]	214	{
				215	return current->vm->id;
				216	}
				217
				218	/**
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	219	* Returns the number of VMs configured to run.
				220	*/
Andrew Walbran	52d9967	2019-06-25 15:51:11 +0100	[diff] [blame]	221	spci_vm_count_t api_vm_get_count(void)
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	222	{
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	223	return vm_get_count();
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	224	}
				225
				226	/**
				227	* Returns the number of vcpus configured in the given VM.
				228	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	229	int64_t api_vcpu_get_count(spci_vm_id_t vm_id, const struct vcpu *current)
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	230	{
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	231	struct vm *vm;
				232
				233	/* Only the primary VM needs to know about vcpus for scheduling. */
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	234	if (current->vm->id != HF_PRIMARY_VM_ID) {
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	235	return -1;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	236	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	237
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	238	vm = vm_find(vm_id);
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	239	if (vm == NULL) {
				240	return -1;
				241	}
				242
				243	return vm->vcpu_count;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	244	}
				245
				246	/**
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	247	* This function is called by the architecture-specific context switching
				248	* function to indicate that register state for the given vcpu has been saved
				249	* and can therefore be used by other pcpus.
				250	*/
				251	void api_regs_state_saved(struct vcpu *vcpu)
				252	{
				253	sl_lock(&vcpu->lock);
				254	vcpu->regs_available = true;
				255	sl_unlock(&vcpu->lock);
				256	}
				257
				258	/**
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	259	* Retrieves the next waiter and removes it from the wait list if the VM's
				260	* mailbox is in a writable state.
				261	*/
				262	static struct wait_entry *api_fetch_waiter(struct vm_locked locked_vm)
				263	{
				264	struct wait_entry *entry;
				265	struct vm *vm = locked_vm.vm;
				266
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	267	if (vm->mailbox.state != MAILBOX_STATE_EMPTY \|\|
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	268	vm->mailbox.recv == NULL \|\| list_empty(&vm->mailbox.waiter_list)) {
				269	/* The mailbox is not writable or there are no waiters. */
				270	return NULL;
				271	}
				272
				273	/* Remove waiter from the wait list. */
				274	entry = CONTAINER_OF(vm->mailbox.waiter_list.next, struct wait_entry,
				275	wait_links);
				276	list_remove(&entry->wait_links);
				277	return entry;
				278	}
				279
				280	/**
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	281	* Assuming that the arguments have already been checked by the caller, injects
				282	* a virtual interrupt of the given ID into the given target vCPU. This doesn't
				283	* cause the vCPU to actually be run immediately; it will be taken when the vCPU
				284	* is next run, which is up to the scheduler.
				285	*
				286	* Returns:
				287	* - 0 on success if no further action is needed.
				288	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				289	* up or kick the target vCPU.
				290	*/
Andrew Walbran	fc9d438	2019-05-10 18:07:21 +0100	[diff] [blame]	291	static int64_t internal_interrupt_inject(struct vcpu *target_vcpu,
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	292	uint32_t intid, struct vcpu *current,
				293	struct vcpu **next)
				294	{
				295	uint32_t intid_index = intid / INTERRUPT_REGISTER_BITS;
				296	uint32_t intid_mask = 1u << (intid % INTERRUPT_REGISTER_BITS);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	297	int64_t ret = 0;
				298
				299	sl_lock(&target_vcpu->lock);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	300
				301	/*
				302	* We only need to change state and (maybe) trigger a virtual IRQ if it
				303	* is enabled and was not previously pending. Otherwise we can skip
				304	* everything except setting the pending bit.
				305	*
				306	* If you change this logic make sure to update the need_vm_lock logic
				307	* above to match.
				308	*/
				309	if (!(target_vcpu->interrupts.interrupt_enabled[intid_index] &
				310	~target_vcpu->interrupts.interrupt_pending[intid_index] &
				311	intid_mask)) {
				312	goto out;
				313	}
				314
				315	/* Increment the count. */
				316	target_vcpu->interrupts.enabled_and_pending_count++;
				317
				318	/*
				319	* Only need to update state if there was not already an
				320	* interrupt enabled and pending.
				321	*/
				322	if (target_vcpu->interrupts.enabled_and_pending_count != 1) {
				323	goto out;
				324	}
				325
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	326	if (current->vm->id == HF_PRIMARY_VM_ID) {
				327	/*
				328	* If the call came from the primary VM, let it know that it
				329	* should run or kick the target vCPU.
				330	*/
				331	ret = 1;
				332	} else if (current != target_vcpu && next != NULL) {
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	333	*next = api_wake_up(current, target_vcpu);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	334	}
				335
				336	out:
				337	/* Either way, make it pending. */
				338	target_vcpu->interrupts.interrupt_pending[intid_index] \|= intid_mask;
				339
				340	sl_unlock(&target_vcpu->lock);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	341
				342	return ret;
				343	}
				344
				345	/**
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	346	* Prepares the vcpu to run by updating its state and fetching whether a return
				347	* value needs to be forced onto the vCPU.
				348	*/
Andrew Scull	38772ab	2019-01-24 15:16:50 +0000	[diff] [blame]	349	static bool api_vcpu_prepare_run(const struct vcpu current, struct vcpu vcpu,
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	350	struct hf_vcpu_run_return *run_ret)
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	351	{
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	352	bool need_vm_lock;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	353	bool ret;
				354
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	355	/*
Andrew Scull	4caadaf	2019-07-03 13:13:47 +0100	[diff] [blame]	356	* Wait until the registers become available. All locks must be released
				357	* between iterations of this loop to avoid potential deadlocks if, on
				358	* any path, a lock needs to be taken after taking the decision to
				359	* switch context but before the registers have been saved.
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	360	*
Andrew Scull	4caadaf	2019-07-03 13:13:47 +0100	[diff] [blame]	361	* The VM lock is not needed in the common case so it must only be taken
				362	* when it is going to be needed. This ensures there are no inter-vCPU
				363	* dependencies in the common run case meaning the sensitive context
				364	* switch performance is consistent.
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	365	*/
				366	for (;;) {
				367	sl_lock(&vcpu->lock);
				368
				369	/* The VM needs to be locked to deliver mailbox messages. */
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	370	need_vm_lock = vcpu->state == VCPU_STATE_BLOCKED_MAILBOX;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	371	if (need_vm_lock) {
				372	sl_unlock(&vcpu->lock);
				373	sl_lock(&vcpu->vm->lock);
				374	sl_lock(&vcpu->lock);
				375	}
				376
				377	if (vcpu->regs_available) {
				378	break;
				379	}
				380
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	381	if (vcpu->state == VCPU_STATE_RUNNING) {
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	382	/*
				383	* vCPU is running on another pCPU.
				384	*
Andrew Walbran	abf88fb	2019-06-21 12:17:47 +0100	[diff] [blame]	385	* It's ok not to return the sleep duration here because
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	386	* the other physical CPU that is currently running this
Andrew Walbran	abf88fb	2019-06-21 12:17:47 +0100	[diff] [blame]	387	* vCPU will return the sleep duration if needed. The
				388	* default return value is
				389	* HF_VCPU_RUN_WAIT_FOR_INTERRUPT, so no need to set it
				390	* explicitly.
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	391	*/
				392	ret = false;
				393	goto out;
				394	}
				395
				396	sl_unlock(&vcpu->lock);
				397	if (need_vm_lock) {
				398	sl_unlock(&vcpu->vm->lock);
				399	}
				400	}
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	401
				402	if (atomic_load_explicit(&vcpu->vm->aborting, memory_order_relaxed)) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	403	if (vcpu->state != VCPU_STATE_ABORTED) {
Andrew Scull	8233128	2019-01-25 10:29:34 +0000	[diff] [blame]	404	dlog("Aborting VM %u vCPU %u\n", vcpu->vm->id,
				405	vcpu_index(vcpu));
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	406	vcpu->state = VCPU_STATE_ABORTED;
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	407	}
				408	ret = false;
				409	goto out;
				410	}
				411
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	412	switch (vcpu->state) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	413	case VCPU_STATE_RUNNING:
				414	case VCPU_STATE_OFF:
				415	case VCPU_STATE_ABORTED:
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	416	ret = false;
				417	goto out;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	418
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	419	case VCPU_STATE_BLOCKED_MAILBOX:
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	420	/*
				421	* A pending message allows the vCPU to run so the message can
				422	* be delivered directly.
				423	*/
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	424	if (vcpu->vm->mailbox.state == MAILBOX_STATE_RECEIVED) {
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	425	arch_regs_set_retval(&vcpu->regs, SPCI_SUCCESS);
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	426	vcpu->vm->mailbox.state = MAILBOX_STATE_READ;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	427	break;
				428	}
				429	/* Fall through. */
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	430	case VCPU_STATE_BLOCKED_INTERRUPT:
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	431	/* Allow virtual interrupts to be delivered. */
				432	if (vcpu->interrupts.enabled_and_pending_count > 0) {
				433	break;
				434	}
				435
				436	/* The timer expired so allow the interrupt to be delivered. */
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	437	if (arch_timer_pending(&vcpu->regs)) {
				438	break;
				439	}
				440
				441	/*
				442	* The vCPU is not ready to run, return the appropriate code to
				443	* the primary which called vcpu_run.
				444	*/
				445	if (arch_timer_enabled(&vcpu->regs)) {
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	446	run_ret->code =
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	447	vcpu->state == VCPU_STATE_BLOCKED_MAILBOX
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	448	? HF_VCPU_RUN_WAIT_FOR_MESSAGE
				449	: HF_VCPU_RUN_WAIT_FOR_INTERRUPT;
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	450	run_ret->sleep.ns =
				451	arch_timer_remaining_ns(&vcpu->regs);
				452	}
				453
				454	ret = false;
				455	goto out;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	456
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	457	case VCPU_STATE_READY:
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	458	break;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	459	}
				460
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	461	/* It has been decided that the vCPU should be run. */
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	462	vcpu->cpu = current->cpu;
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	463	vcpu->state = VCPU_STATE_RUNNING;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	464
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	465	/*
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	466	* Mark the registers as unavailable now that we're about to reflect
				467	* them onto the real registers. This will also prevent another physical
				468	* CPU from trying to read these registers.
				469	*/
				470	vcpu->regs_available = false;
				471
				472	ret = true;
				473
				474	out:
				475	sl_unlock(&vcpu->lock);
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	476	if (need_vm_lock) {
				477	sl_unlock(&vcpu->vm->lock);
				478	}
				479
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	480	return ret;
				481	}
				482
				483	/**
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	484	* Runs the given vcpu of the given vm.
				485	*/
Andrew Walbran	b037d5b	2019-06-25 17:19:41 +0100	[diff] [blame]	486	struct hf_vcpu_run_return api_vcpu_run(spci_vm_id_t vm_id,
				487	spci_vcpu_index_t vcpu_idx,
Andrew Scull	38772ab	2019-01-24 15:16:50 +0000	[diff] [blame]	488	const struct vcpu *current,
				489	struct vcpu **next)
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	490	{
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	491	struct vm *vm;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	492	struct vcpu *vcpu;
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	493	struct hf_vcpu_run_return ret = {
				494	.code = HF_VCPU_RUN_WAIT_FOR_INTERRUPT,
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	495	.sleep.ns = HF_SLEEP_INDEFINITE,
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	496	};
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	497
				498	/* Only the primary VM can switch vcpus. */
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	499	if (current->vm->id != HF_PRIMARY_VM_ID) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	500	goto out;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	501	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	502
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	503	/* Only secondary VM vcpus can be run. */
				504	if (vm_id == HF_PRIMARY_VM_ID) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	505	goto out;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	506	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	507
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	508	/* The requested VM must exist. */
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	509	vm = vm_find(vm_id);
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	510	if (vm == NULL) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	511	goto out;
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	512	}
				513
				514	/* The requested vcpu must exist. */
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	515	if (vcpu_idx >= vm->vcpu_count) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	516	goto out;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	517	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	518
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	519	/* Update state if allowed. */
Andrew Walbran	e1310df	2019-04-29 17:28:28 +0100	[diff] [blame]	520	vcpu = vm_get_vcpu(vm, vcpu_idx);
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	521	if (!api_vcpu_prepare_run(current, vcpu, &ret)) {
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	522	goto out;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	523	}
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	524
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	525	/*
				526	* Inject timer interrupt if timer has expired. It's safe to access
				527	* vcpu->regs here because api_vcpu_prepare_run already made sure that
				528	* regs_available was true (and then set it to false) before returning
				529	* true.
				530	*/
				531	if (arch_timer_pending(&vcpu->regs)) {
				532	/* Make virtual timer interrupt pending. */
Andrew Walbran	fc9d438	2019-05-10 18:07:21 +0100	[diff] [blame]	533	internal_interrupt_inject(vcpu, HF_VIRTUAL_TIMER_INTID, vcpu,
				534	NULL);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	535
				536	/*
				537	* Set the mask bit so the hardware interrupt doesn't fire
				538	* again. Ideally we wouldn't do this because it affects what
				539	* the secondary vCPU sees, but if we don't then we end up with
				540	* a loop of the interrupt firing each time we try to return to
				541	* the secondary vCPU.
				542	*/
				543	arch_timer_mask(&vcpu->regs);
				544	}
				545
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	546	/* Switch to the vcpu. */
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	547	*next = vcpu;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	548
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	549	/*
				550	* Set a placeholder return code to the scheduler. This will be
				551	* overwritten when the switch back to the primary occurs.
				552	*/
				553	ret.code = HF_VCPU_RUN_PREEMPTED;
				554
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	555	out:
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	556	return ret;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	557	}
				558
				559	/**
Andrew Scull	81e8509	2018-12-12 12:56:20 +0000	[diff] [blame]	560	* Check that the mode indicates memory that is valid, owned and exclusive.
				561	*/
Andrew Scull	cbefbdb	2019-01-11 16:36:26 +0000	[diff] [blame]	562	static bool api_mode_valid_owned_and_exclusive(int mode)
Andrew Scull	81e8509	2018-12-12 12:56:20 +0000	[diff] [blame]	563	{
				564	return (mode & (MM_MODE_INVALID \| MM_MODE_UNOWNED \| MM_MODE_SHARED)) ==
				565	0;
				566	}
				567
				568	/**
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	569	* Determines the value to be returned by api_vm_configure and api_mailbox_clear
				570	* after they've succeeded. If a secondary VM is running and there are waiters,
				571	* it also switches back to the primary VM for it to wake waiters up.
				572	*/
				573	static int64_t api_waiter_result(struct vm_locked locked_vm,
				574	struct vcpu current, struct vcpu *next)
				575	{
				576	struct vm *vm = locked_vm.vm;
				577	struct hf_vcpu_run_return ret = {
				578	.code = HF_VCPU_RUN_NOTIFY_WAITERS,
				579	};
				580
				581	if (list_empty(&vm->mailbox.waiter_list)) {
				582	/* No waiters, nothing else to do. */
				583	return 0;
				584	}
				585
				586	if (vm->id == HF_PRIMARY_VM_ID) {
				587	/* The caller is the primary VM. Tell it to wake up waiters. */
				588	return 1;
				589	}
				590
				591	/*
				592	* Switch back to the primary VM, informing it that there are waiters
				593	* that need to be notified.
				594	*/
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	595	*next = api_switch_to_primary(current, ret, VCPU_STATE_READY);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	596
				597	return 0;
				598	}
				599
				600	/**
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	601	* Configures the hypervisor's stage-1 view of the send and receive pages. The
				602	* stage-1 page tables must be locked so memory cannot be taken by another core
				603	* which could result in this transaction being unable to roll back in the case
				604	* of an error.
				605	*/
				606	static bool api_vm_configure_stage1(struct vm_locked vm_locked,
				607	paddr_t pa_send_begin, paddr_t pa_send_end,
				608	paddr_t pa_recv_begin, paddr_t pa_recv_end,
				609	struct mpool *local_page_pool)
				610	{
				611	bool ret;
				612	struct mm_stage1_locked mm_stage1_locked = mm_lock_stage1();
				613
				614	/* Map the send page as read-only in the hypervisor address space. */
				615	vm_locked.vm->mailbox.send =
				616	mm_identity_map(mm_stage1_locked, pa_send_begin, pa_send_end,
				617	MM_MODE_R, local_page_pool);
				618	if (!vm_locked.vm->mailbox.send) {
				619	/* TODO: partial defrag of failed range. */
				620	/* Recover any memory consumed in failed mapping. */
				621	mm_defrag(mm_stage1_locked, local_page_pool);
				622	goto fail;
				623	}
				624
				625	/*
				626	* Map the receive page as writable in the hypervisor address space. On
				627	* failure, unmap the send page before returning.
				628	*/
				629	vm_locked.vm->mailbox.recv =
				630	mm_identity_map(mm_stage1_locked, pa_recv_begin, pa_recv_end,
				631	MM_MODE_W, local_page_pool);
				632	if (!vm_locked.vm->mailbox.recv) {
				633	/* TODO: partial defrag of failed range. */
				634	/* Recover any memory consumed in failed mapping. */
				635	mm_defrag(mm_stage1_locked, local_page_pool);
				636	goto fail_undo_send;
				637	}
				638
				639	ret = true;
				640	goto out;
				641
				642	/*
				643	* The following mappings will not require more memory than is available
				644	* in the local pool.
				645	*/
				646	fail_undo_send:
				647	vm_locked.vm->mailbox.send = NULL;
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	648	CHECK(mm_unmap(mm_stage1_locked, pa_send_begin, pa_send_end,
				649	local_page_pool));
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	650
				651	fail:
				652	ret = false;
				653
				654	out:
				655	mm_unlock_stage1(&mm_stage1_locked);
				656
				657	return ret;
				658	}
				659
				660	/**
				661	* Configures the send and receive pages in the VM stage-2 and hypervisor
				662	* stage-1 page tables. Locking of the page tables combined with a local memory
				663	* pool ensures there will always be enough memory to recover from any errors
				664	* that arise.
				665	*/
				666	static bool api_vm_configure_pages(struct vm_locked vm_locked,
				667	paddr_t pa_send_begin, paddr_t pa_send_end,
				668	int orig_send_mode, paddr_t pa_recv_begin,
				669	paddr_t pa_recv_end, int orig_recv_mode)
				670	{
				671	bool ret;
				672	struct mpool local_page_pool;
				673
				674	/*
				675	* Create a local pool so any freed memory can't be used by another
				676	* thread. This is to ensure the original mapping can be restored if any
				677	* stage of the process fails.
				678	*/
				679	mpool_init_with_fallback(&local_page_pool, &api_page_pool);
				680
				681	/* Take memory ownership away from the VM and mark as shared. */
				682	if (!mm_vm_identity_map(
				683	&vm_locked.vm->ptable, pa_send_begin, pa_send_end,
				684	MM_MODE_UNOWNED \| MM_MODE_SHARED \| MM_MODE_R \| MM_MODE_W,
				685	NULL, &local_page_pool)) {
				686	goto fail;
				687	}
				688
				689	if (!mm_vm_identity_map(&vm_locked.vm->ptable, pa_recv_begin,
				690	pa_recv_end,
				691	MM_MODE_UNOWNED \| MM_MODE_SHARED \| MM_MODE_R,
				692	NULL, &local_page_pool)) {
				693	/* TODO: partial defrag of failed range. */
				694	/* Recover any memory consumed in failed mapping. */
				695	mm_vm_defrag(&vm_locked.vm->ptable, &local_page_pool);
				696	goto fail_undo_send;
				697	}
				698
				699	if (!api_vm_configure_stage1(vm_locked, pa_send_begin, pa_send_end,
				700	pa_recv_begin, pa_recv_end,
				701	&local_page_pool)) {
				702	goto fail_undo_send_and_recv;
				703	}
				704
				705	ret = true;
				706	goto out;
				707
				708	/*
				709	* The following mappings will not require more memory than is available
				710	* in the local pool.
				711	*/
				712	fail_undo_send_and_recv:
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	713	CHECK(mm_vm_identity_map(&vm_locked.vm->ptable, pa_recv_begin,
				714	pa_recv_end, orig_recv_mode, NULL,
				715	&local_page_pool));
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	716
				717	fail_undo_send:
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	718	CHECK(mm_vm_identity_map(&vm_locked.vm->ptable, pa_send_begin,
				719	pa_send_end, orig_send_mode, NULL,
				720	&local_page_pool));
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	721
				722	fail:
				723	ret = false;
				724
				725	out:
				726	mpool_fini(&local_page_pool);
				727
				728	return ret;
				729	}
				730
				731	/**
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	732	* Configures the VM to send/receive data through the specified pages. The pages
				733	* must not be shared.
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	734	*
				735	* Returns:
				736	* - -1 on failure.
				737	* - 0 on success if no further action is needed.
				738	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				739	* up or kick waiters. Waiters should be retrieved by calling
				740	* hf_mailbox_waiter_get.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	741	*/
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	742	int64_t api_vm_configure(ipaddr_t send, ipaddr_t recv, struct vcpu *current,
				743	struct vcpu **next)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	744	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	745	struct vm *vm = current->vm;
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	746	struct vm_locked vm_locked;
Andrew Scull	8087132	2018-08-06 12:04:09 +0100	[diff] [blame]	747	paddr_t pa_send_begin;
				748	paddr_t pa_send_end;
				749	paddr_t pa_recv_begin;
				750	paddr_t pa_recv_end;
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	751	int orig_send_mode;
				752	int orig_recv_mode;
Andrew Scull	c0e569a	2018-10-02 18:05:21 +0100	[diff] [blame]	753	int64_t ret;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	754
				755	/* Fail if addresses are not page-aligned. */
Alfredo Mazzinghi	eb1997c	2019-02-07 18:00:01 +0000	[diff] [blame]	756	if (!is_aligned(ipa_addr(send), PAGE_SIZE) \|\|
				757	!is_aligned(ipa_addr(recv), PAGE_SIZE)) {
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	758	return -1;
				759	}
				760
Andrew Scull	c2eb6a3	2018-12-13 16:54:24 +0000	[diff] [blame]	761	/* Convert to physical addresses. */
				762	pa_send_begin = pa_from_ipa(send);
				763	pa_send_end = pa_add(pa_send_begin, PAGE_SIZE);
				764
				765	pa_recv_begin = pa_from_ipa(recv);
				766	pa_recv_end = pa_add(pa_recv_begin, PAGE_SIZE);
				767
Andrew Scull	c9ccb3f	2018-08-13 15:27:12 +0100	[diff] [blame]	768	/* Fail if the same page is used for the send and receive pages. */
				769	if (pa_addr(pa_send_begin) == pa_addr(pa_recv_begin)) {
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	770	return -1;
				771	}
				772
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	773	/*
				774	* The hypervisor's memory map must be locked for the duration of this
				775	* operation to ensure there will be sufficient memory to recover from
				776	* any failures.
				777	*
				778	* TODO: the scope of the can be reduced but will require restructuring
				779	* to keep a single unlock point.
				780	*/
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	781	vm_locked = vm_lock(vm);
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	782
				783	/* We only allow these to be setup once. */
				784	if (vm->mailbox.send \|\| vm->mailbox.recv) {
				785	goto fail;
				786	}
				787
				788	/*
				789	* Ensure the pages are valid, owned and exclusive to the VM and that
				790	* the VM has the required access to the memory.
				791	*/
				792	if (!mm_vm_get_mode(&vm->ptable, send, ipa_add(send, PAGE_SIZE),
				793	&orig_send_mode) \|\|
				794	!api_mode_valid_owned_and_exclusive(orig_send_mode) \|\|
				795	(orig_send_mode & MM_MODE_R) == 0 \|\|
				796	(orig_send_mode & MM_MODE_W) == 0) {
				797	goto fail;
				798	}
				799
				800	if (!mm_vm_get_mode(&vm->ptable, recv, ipa_add(recv, PAGE_SIZE),
				801	&orig_recv_mode) \|\|
				802	!api_mode_valid_owned_and_exclusive(orig_recv_mode) \|\|
				803	(orig_recv_mode & MM_MODE_R) == 0) {
				804	goto fail;
				805	}
				806
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	807	if (!api_vm_configure_pages(vm_locked, pa_send_begin, pa_send_end,
				808	orig_send_mode, pa_recv_begin, pa_recv_end,
				809	orig_recv_mode)) {
				810	goto fail;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	811	}
				812
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	813	/* Tell caller about waiters, if any. */
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	814	ret = api_waiter_result(vm_locked, current, next);
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	815	goto exit;
				816
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	817	fail:
				818	ret = -1;
				819
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	820	exit:
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	821	vm_unlock(&vm_locked);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	822
				823	return ret;
				824	}
				825
				826	/**
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	827	* Copies data from the sender's send buffer to the recipient's receive buffer
				828	* and notifies the recipient.
Wedson Almeida Filho	17c997f	2019-01-09 18:50:09 +0000	[diff] [blame]	829	*
				830	* If the recipient's receive buffer is busy, it can optionally register the
				831	* caller to be notified when the recipient's receive buffer becomes available.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	832	*/
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	833	int32_t api_spci_msg_send(uint32_t attributes, struct vcpu *current,
				834	struct vcpu **next)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	835	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	836	struct vm *from = current->vm;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	837	struct vm *to;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	838	struct hf_vcpu_run_return primary_ret = {
				839	.code = HF_VCPU_RUN_MESSAGE,
				840	};
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	841	struct spci_message from_msg_replica;
				842	struct spci_message *to_msg;
				843	const struct spci_message *from_msg;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	844
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	845	uint32_t size;
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	846
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	847	int64_t ret;
				848	bool notify = (attributes & SPCI_MSG_SEND_NOTIFY_MASK) ==
				849	SPCI_MSG_SEND_NOTIFY;
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	850
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	851	/*
				852	* Check that the sender has configured its send buffer. Copy the
				853	* message header. If the tx mailbox at from_msg is configured (i.e.
				854	* from_msg != NULL) then it can be safely accessed after releasing the
				855	* lock since the tx mailbox address can only be configured once.
				856	*/
				857	sl_lock(&from->lock);
				858	from_msg = from->mailbox.send;
				859	sl_unlock(&from->lock);
				860
				861	if (from_msg == NULL) {
				862	return SPCI_INVALID_PARAMETERS;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	863	}
				864
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	865	/*
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	866	* Note that the payload is not copied when the message header is.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	867	*/
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	868	from_msg_replica = *from_msg;
				869
				870	/* Ensure source VM id corresponds to the current VM. */
				871	if (from_msg_replica.source_vm_id != from->id) {
				872	return SPCI_INVALID_PARAMETERS;
				873	}
				874
				875	size = from_msg_replica.length;
				876	/* Limit the size of transfer. */
Andrew Scull	1262ac2	2019-04-05 12:44:26 +0100	[diff] [blame]	877	if (size > SPCI_MSG_PAYLOAD_MAX) {
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	878	return SPCI_INVALID_PARAMETERS;
				879	}
				880
				881	/* Disallow reflexive requests as this suggests an error in the VM. */
				882	if (from_msg_replica.target_vm_id == from->id) {
				883	return SPCI_INVALID_PARAMETERS;
				884	}
				885
				886	/* Ensure the target VM exists. */
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	887	to = vm_find(from_msg_replica.target_vm_id);
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	888	if (to == NULL) {
				889	return SPCI_INVALID_PARAMETERS;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	890	}
				891
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	892	sl_lock(&to->lock);
				893
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	894	if (to->mailbox.state != MAILBOX_STATE_EMPTY \|\|
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	895	to->mailbox.recv == NULL) {
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	896	/*
				897	* Fail if the target isn't currently ready to receive data,
				898	* setting up for notification if requested.
				899	*/
				900	if (notify) {
Wedson Almeida Filho	b790f65	2019-01-22 23:41:56 +0000	[diff] [blame]	901	struct wait_entry *entry =
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	902	&current->vm->wait_entries
				903	[from_msg_replica.target_vm_id];
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	904
				905	/* Append waiter only if it's not there yet. */
				906	if (list_empty(&entry->wait_links)) {
				907	list_append(&to->mailbox.waiter_list,
				908	&entry->wait_links);
				909	}
				910	}
				911
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	912	ret = SPCI_BUSY;
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	913	goto out;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	914	}
				915
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	916	/* Copy data. */
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	917	to_msg = to->mailbox.recv;
				918	*to_msg = from_msg_replica;
Andrew Scull	a1aa2ba	2019-04-05 11:49:02 +0100	[diff] [blame]	919	memcpy_s(to_msg->payload, SPCI_MSG_PAYLOAD_MAX,
				920	from->mailbox.send->payload, size);
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	921	primary_ret.message.vm_id = to->id;
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	922	ret = SPCI_SUCCESS;
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	923
				924	/* Messages for the primary VM are delivered directly. */
				925	if (to->id == HF_PRIMARY_VM_ID) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	926	to->mailbox.state = MAILBOX_STATE_READ;
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	927	*next = api_switch_to_primary(current, primary_ret,
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	928	VCPU_STATE_READY);
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	929	goto out;
				930	}
				931
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	932	to->mailbox.state = MAILBOX_STATE_RECEIVED;
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	933
				934	/* Return to the primary VM directly or with a switch. */
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	935	if (from->id != HF_PRIMARY_VM_ID) {
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	936	*next = api_switch_to_primary(current, primary_ret,
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	937	VCPU_STATE_READY);
Wedson Almeida Filho	80eb4a3	2018-11-30 17:11:15 +0000	[diff] [blame]	938	}
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	939
				940	out:
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	941	sl_unlock(&to->lock);
				942
Wedson Almeida Filho	80eb4a3	2018-11-30 17:11:15 +0000	[diff] [blame]	943	return ret;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	944	}
				945
				946	/**
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	947	* Receives a message from the mailbox. If one isn't available, this function
				948	* can optionally block the caller until one becomes available.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	949	*
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	950	* No new messages can be received until the mailbox has been cleared.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	951	*/
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	952	int32_t api_spci_msg_recv(uint32_t attributes, struct vcpu *current,
				953	struct vcpu **next)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	954	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	955	struct vm *vm = current->vm;
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	956	int32_t return_code;
				957	bool block =
				958	(attributes & SPCI_MSG_RECV_BLOCK_MASK) == SPCI_MSG_RECV_BLOCK;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	959
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	960	/*
				961	* The primary VM will receive messages as a status code from running
				962	* vcpus and must not call this function.
				963	*/
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	964	if (vm->id == HF_PRIMARY_VM_ID) {
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	965	return SPCI_INTERRUPTED;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	966	}
				967
				968	sl_lock(&vm->lock);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	969
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	970	/* Return pending messages without blocking. */
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	971	if (vm->mailbox.state == MAILBOX_STATE_RECEIVED) {
				972	vm->mailbox.state = MAILBOX_STATE_READ;
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	973	return_code = SPCI_SUCCESS;
				974	goto out;
				975	}
				976
				977	/* No pending message so fail if not allowed to block. */
				978	if (!block) {
				979	return_code = SPCI_RETRY;
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	980	goto out;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	981	}
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	982
Andrew Walbran	9311c9a	2019-03-12 16:59:04 +0000	[diff] [blame]	983	/*
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	984	* From this point onward this call can only be interrupted or a message
				985	* received. If a message is received the return value will be set at
				986	* that time to SPCI_SUCCESS.
Andrew Walbran	9311c9a	2019-03-12 16:59:04 +0000	[diff] [blame]	987	*/
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	988	return_code = SPCI_INTERRUPTED;
				989
				990	/*
				991	* Don't block if there are enabled and pending interrupts, to match
				992	* behaviour of wait_for_interrupt.
				993	*/
				994	if (current->interrupts.enabled_and_pending_count > 0) {
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	995	goto out;
				996	}
				997
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	998	/* Switch back to primary vm to block. */
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	999	{
				1000	struct hf_vcpu_run_return run_return = {
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	1001	.code = HF_VCPU_RUN_WAIT_FOR_MESSAGE,
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1002	};
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1003
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1004	*next = api_switch_to_primary(current, run_return,
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1005	VCPU_STATE_BLOCKED_MAILBOX);
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1006	}
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1007	out:
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1008	sl_unlock(&vm->lock);
				1009
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	1010	return return_code;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1011	}
				1012
				1013	/**
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1014	* Retrieves the next VM whose mailbox became writable. For a VM to be notified
				1015	* by this function, the caller must have called api_mailbox_send before with
				1016	* the notify argument set to true, and this call must have failed because the
				1017	* mailbox was not available.
				1018	*
				1019	* It should be called repeatedly to retrieve a list of VMs.
				1020	*
				1021	* Returns -1 if no VM became writable, or the id of the VM whose mailbox
				1022	* became writable.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1023	*/
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1024	int64_t api_mailbox_writable_get(const struct vcpu *current)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1025	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	1026	struct vm *vm = current->vm;
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1027	struct wait_entry *entry;
Andrew Scull	c0e569a	2018-10-02 18:05:21 +0100	[diff] [blame]	1028	int64_t ret;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1029
				1030	sl_lock(&vm->lock);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1031	if (list_empty(&vm->mailbox.ready_list)) {
				1032	ret = -1;
				1033	goto exit;
				1034	}
				1035
				1036	entry = CONTAINER_OF(vm->mailbox.ready_list.next, struct wait_entry,
				1037	ready_links);
				1038	list_remove(&entry->ready_links);
Wedson Almeida Filho	b790f65	2019-01-22 23:41:56 +0000	[diff] [blame]	1039	ret = entry - vm->wait_entries;
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1040
				1041	exit:
				1042	sl_unlock(&vm->lock);
				1043	return ret;
				1044	}
				1045
				1046	/**
				1047	* Retrieves the next VM waiting to be notified that the mailbox of the
				1048	* specified VM became writable. Only primary VMs are allowed to call this.
				1049	*
Wedson Almeida Filho	b790f65	2019-01-22 23:41:56 +0000	[diff] [blame]	1050	* Returns -1 on failure or if there are no waiters; the VM id of the next
				1051	* waiter otherwise.
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1052	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1053	int64_t api_mailbox_waiter_get(spci_vm_id_t vm_id, const struct vcpu *current)
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1054	{
				1055	struct vm *vm;
				1056	struct vm_locked locked;
				1057	struct wait_entry *entry;
				1058	struct vm *waiting_vm;
				1059
				1060	/* Only primary VMs are allowed to call this function. */
				1061	if (current->vm->id != HF_PRIMARY_VM_ID) {
				1062	return -1;
				1063	}
				1064
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1065	vm = vm_find(vm_id);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1066	if (vm == NULL) {
				1067	return -1;
				1068	}
				1069
				1070	/* Check if there are outstanding notifications from given vm. */
Andrew Walbran	7e932bd	2019-04-29 16:47:06 +0100	[diff] [blame]	1071	locked = vm_lock(vm);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1072	entry = api_fetch_waiter(locked);
				1073	vm_unlock(&locked);
				1074
				1075	if (entry == NULL) {
				1076	return -1;
				1077	}
				1078
				1079	/* Enqueue notification to waiting VM. */
				1080	waiting_vm = entry->waiting_vm;
				1081
				1082	sl_lock(&waiting_vm->lock);
				1083	if (list_empty(&entry->ready_links)) {
				1084	list_append(&waiting_vm->mailbox.ready_list,
				1085	&entry->ready_links);
				1086	}
				1087	sl_unlock(&waiting_vm->lock);
				1088
				1089	return waiting_vm->id;
				1090	}
				1091
				1092	/**
				1093	* Clears the caller's mailbox so that a new message can be received. The caller
				1094	* must have copied out all data they wish to preserve as new messages will
				1095	* overwrite the old and will arrive asynchronously.
				1096	*
				1097	* Returns:
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1098	* - -1 on failure, if the mailbox hasn't been read.
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1099	* - 0 on success if no further action is needed.
				1100	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				1101	* up or kick waiters. Waiters should be retrieved by calling
				1102	* hf_mailbox_waiter_get.
				1103	*/
				1104	int64_t api_mailbox_clear(struct vcpu current, struct vcpu *next)
				1105	{
				1106	struct vm *vm = current->vm;
				1107	struct vm_locked locked;
				1108	int64_t ret;
				1109
Andrew Walbran	7e932bd	2019-04-29 16:47:06 +0100	[diff] [blame]	1110	locked = vm_lock(vm);
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1111	switch (vm->mailbox.state) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1112	case MAILBOX_STATE_EMPTY:
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1113	ret = 0;
				1114	break;
				1115
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1116	case MAILBOX_STATE_RECEIVED:
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1117	ret = -1;
				1118	break;
				1119
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1120	case MAILBOX_STATE_READ:
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1121	ret = api_waiter_result(locked, current, next);
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1122	vm->mailbox.state = MAILBOX_STATE_EMPTY;
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1123	break;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1124	}
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1125	vm_unlock(&locked);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1126
				1127	return ret;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	1128	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1129
				1130	/**
				1131	* Enables or disables a given interrupt ID for the calling vCPU.
				1132	*
				1133	* Returns 0 on success, or -1 if the intid is invalid.
				1134	*/
Wedson Almeida Filho	c559d13	2019-01-09 19:33:40 +0000	[diff] [blame]	1135	int64_t api_interrupt_enable(uint32_t intid, bool enable, struct vcpu *current)
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1136	{
				1137	uint32_t intid_index = intid / INTERRUPT_REGISTER_BITS;
				1138	uint32_t intid_mask = 1u << (intid % INTERRUPT_REGISTER_BITS);
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1139
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1140	if (intid >= HF_NUM_INTIDS) {
				1141	return -1;
				1142	}
				1143
				1144	sl_lock(&current->lock);
				1145	if (enable) {
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1146	/*
				1147	* If it is pending and was not enabled before, increment the
				1148	* count.
				1149	*/
				1150	if (current->interrupts.interrupt_pending[intid_index] &
				1151	~current->interrupts.interrupt_enabled[intid_index] &
				1152	intid_mask) {
				1153	current->interrupts.enabled_and_pending_count++;
				1154	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1155	current->interrupts.interrupt_enabled[intid_index] \|=
				1156	intid_mask;
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1157	} else {
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1158	/*
				1159	* If it is pending and was enabled before, decrement the count.
				1160	*/
				1161	if (current->interrupts.interrupt_pending[intid_index] &
				1162	current->interrupts.interrupt_enabled[intid_index] &
				1163	intid_mask) {
				1164	current->interrupts.enabled_and_pending_count--;
				1165	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1166	current->interrupts.interrupt_enabled[intid_index] &=
				1167	~intid_mask;
				1168	}
				1169
				1170	sl_unlock(&current->lock);
				1171	return 0;
				1172	}
				1173
				1174	/**
				1175	* Returns the ID of the next pending interrupt for the calling vCPU, and
				1176	* acknowledges it (i.e. marks it as no longer pending). Returns
				1177	* HF_INVALID_INTID if there are no pending interrupts.
				1178	*/
Wedson Almeida Filho	c559d13	2019-01-09 19:33:40 +0000	[diff] [blame]	1179	uint32_t api_interrupt_get(struct vcpu *current)
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1180	{
				1181	uint8_t i;
				1182	uint32_t first_interrupt = HF_INVALID_INTID;
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1183
				1184	/*
				1185	* Find the first enabled and pending interrupt ID, return it, and
				1186	* deactivate it.
				1187	*/
				1188	sl_lock(&current->lock);
				1189	for (i = 0; i < HF_NUM_INTIDS / INTERRUPT_REGISTER_BITS; ++i) {
				1190	uint32_t enabled_and_pending =
				1191	current->interrupts.interrupt_enabled[i] &
				1192	current->interrupts.interrupt_pending[i];
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1193
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1194	if (enabled_and_pending != 0) {
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1195	uint8_t bit_index = ctz(enabled_and_pending);
				1196	/*
				1197	* Mark it as no longer pending and decrement the count.
				1198	*/
				1199	current->interrupts.interrupt_pending[i] &=
				1200	~(1u << bit_index);
				1201	current->interrupts.enabled_and_pending_count--;
				1202	first_interrupt =
				1203	i * INTERRUPT_REGISTER_BITS + bit_index;
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1204	break;
				1205	}
				1206	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1207
				1208	sl_unlock(&current->lock);
				1209	return first_interrupt;
				1210	}
				1211
				1212	/**
Andrew Walbran	4cf217a	2018-12-14 15:24:50 +0000	[diff] [blame]	1213	* Returns whether the current vCPU is allowed to inject an interrupt into the
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1214	* given VM and vCPU.
				1215	*/
				1216	static inline bool is_injection_allowed(uint32_t target_vm_id,
				1217	struct vcpu *current)
				1218	{
				1219	uint32_t current_vm_id = current->vm->id;
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1220
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1221	/*
				1222	* The primary VM is allowed to inject interrupts into any VM. Secondary
				1223	* VMs are only allowed to inject interrupts into their own vCPUs.
				1224	*/
				1225	return current_vm_id == HF_PRIMARY_VM_ID \|\|
				1226	current_vm_id == target_vm_id;
				1227	}
				1228
				1229	/**
				1230	* Injects a virtual interrupt of the given ID into the given target vCPU.
				1231	* This doesn't cause the vCPU to actually be run immediately; it will be taken
				1232	* when the vCPU is next run, which is up to the scheduler.
				1233	*
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1234	* Returns:
				1235	* - -1 on failure because the target VM or vCPU doesn't exist, the interrupt
				1236	* ID is invalid, or the current VM is not allowed to inject interrupts to
				1237	* the target VM.
				1238	* - 0 on success if no further action is needed.
				1239	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				1240	* up or kick the target vCPU.
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1241	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1242	int64_t api_interrupt_inject(spci_vm_id_t target_vm_id,
Andrew Walbran	b037d5b	2019-06-25 17:19:41 +0100	[diff] [blame]	1243	spci_vcpu_index_t target_vcpu_idx, uint32_t intid,
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1244	struct vcpu current, struct vcpu *next)
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1245	{
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1246	struct vcpu *target_vcpu;
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1247	struct vm *target_vm = vm_find(target_vm_id);
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1248
				1249	if (intid >= HF_NUM_INTIDS) {
				1250	return -1;
				1251	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1252
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1253	if (target_vm == NULL) {
				1254	return -1;
				1255	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1256
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1257	if (target_vcpu_idx >= target_vm->vcpu_count) {
				1258	/* The requested vcpu must exist. */
				1259	return -1;
				1260	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1261
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1262	if (!is_injection_allowed(target_vm_id, current)) {
				1263	return -1;
				1264	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1265
Andrew Walbran	e1310df	2019-04-29 17:28:28 +0100	[diff] [blame]	1266	target_vcpu = vm_get_vcpu(target_vm, target_vcpu_idx);
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1267
				1268	dlog("Injecting IRQ %d for VM %d VCPU %d from VM %d VCPU %d\n", intid,
				1269	target_vm_id, target_vcpu_idx, current->vm->id, current->cpu->id);
Andrew Walbran	fc9d438	2019-05-10 18:07:21 +0100	[diff] [blame]	1270	return internal_interrupt_inject(target_vcpu, intid, current, next);
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1271	}
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1272
				1273	/**
				1274	* Clears a region of physical memory by overwriting it with zeros. The data is
				1275	* flushed from the cache so the memory has been cleared across the system.
				1276	*/
				1277	static bool api_clear_memory(paddr_t begin, paddr_t end, struct mpool *ppool)
				1278	{
				1279	/*
				1280	* TODO: change this to a cpu local single page window rather than a
				1281	* global mapping of the whole range. Such an approach will limit
				1282	* the changes to stage-1 tables and will allow only local
				1283	* invalidation.
				1284	*/
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1285	bool ret;
				1286	struct mm_stage1_locked stage1_locked = mm_lock_stage1();
				1287	void *ptr =
				1288	mm_identity_map(stage1_locked, begin, end, MM_MODE_W, ppool);
Andrew Walbran	2cb4339	2019-04-17 12:52:45 +0100	[diff] [blame]	1289	size_t size = pa_difference(begin, end);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1290
				1291	if (!ptr) {
				1292	/* TODO: partial defrag of failed range. */
				1293	/* Recover any memory consumed in failed mapping. */
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1294	mm_defrag(stage1_locked, ppool);
				1295	goto fail;
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1296	}
				1297
Andrew Scull	2b5fbad	2019-04-05 13:55:56 +0100	[diff] [blame]	1298	memset_s(ptr, size, 0, size);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1299	arch_mm_write_back_dcache(ptr, size);
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1300	mm_unmap(stage1_locked, begin, end, ppool);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1301
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1302	ret = true;
				1303	goto out;
				1304
				1305	fail:
				1306	ret = false;
				1307
				1308	out:
				1309	mm_unlock_stage1(&stage1_locked);
				1310
				1311	return ret;
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1312	}
				1313
				1314	/**
				1315	* Shares memory from the calling VM with another. The memory can be shared in
				1316	* different modes.
				1317	*
				1318	* TODO: the interface for sharing memory will need to be enhanced to allow
				1319	* sharing with different modes e.g. read-only, informing the recipient
				1320	* of the memory they have been given, opting to not wipe the memory and
				1321	* possibly allowing multiple blocks to be transferred. What this will
				1322	* look like is TBD.
				1323	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1324	int64_t api_share_memory(spci_vm_id_t vm_id, ipaddr_t addr, size_t size,
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1325	enum hf_share share, struct vcpu *current)
				1326	{
				1327	struct vm *from = current->vm;
				1328	struct vm *to;
				1329	int orig_from_mode;
				1330	int from_mode;
				1331	int to_mode;
				1332	ipaddr_t begin;
				1333	ipaddr_t end;
				1334	paddr_t pa_begin;
				1335	paddr_t pa_end;
				1336	struct mpool local_page_pool;
				1337	int64_t ret;
				1338
				1339	/* Disallow reflexive shares as this suggests an error in the VM. */
				1340	if (vm_id == from->id) {
				1341	return -1;
				1342	}
				1343
				1344	/* Ensure the target VM exists. */
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1345	to = vm_find(vm_id);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1346	if (to == NULL) {
				1347	return -1;
				1348	}
				1349
				1350	begin = addr;
				1351	end = ipa_add(addr, size);
				1352
				1353	/* Fail if addresses are not page-aligned. */
Alfredo Mazzinghi	eb1997c	2019-02-07 18:00:01 +0000	[diff] [blame]	1354	if (!is_aligned(ipa_addr(begin), PAGE_SIZE) \|\|
				1355	!is_aligned(ipa_addr(end), PAGE_SIZE)) {
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1356	return -1;
				1357	}
				1358
				1359	/* Convert the sharing request to memory management modes. */
				1360	switch (share) {
				1361	case HF_MEMORY_GIVE:
				1362	from_mode = MM_MODE_INVALID \| MM_MODE_UNOWNED;
				1363	to_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X;
				1364	break;
				1365
				1366	case HF_MEMORY_LEND:
				1367	from_mode = MM_MODE_INVALID;
				1368	to_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X \| MM_MODE_UNOWNED;
				1369	break;
				1370
				1371	case HF_MEMORY_SHARE:
				1372	from_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X \| MM_MODE_SHARED;
				1373	to_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X \| MM_MODE_UNOWNED \|
				1374	MM_MODE_SHARED;
				1375	break;
				1376
				1377	default:
				1378	/* The input is untrusted so might not be a valid value. */
				1379	return -1;
				1380	}
				1381
				1382	/*
				1383	* Create a local pool so any freed memory can't be used by another
				1384	* thread. This is to ensure the original mapping can be restored if any
				1385	* stage of the process fails.
				1386	*/
				1387	mpool_init_with_fallback(&local_page_pool, &api_page_pool);
				1388
				1389	sl_lock_both(&from->lock, &to->lock);
				1390
				1391	/*
				1392	* Ensure that the memory range is mapped with the same mode so that
				1393	* changes can be reverted if the process fails.
				1394	*/
				1395	if (!mm_vm_get_mode(&from->ptable, begin, end, &orig_from_mode)) {
				1396	goto fail;
				1397	}
				1398
				1399	/*
				1400	* Ensure the memory range is valid for the sender. If it isn't, the
				1401	* sender has either shared it with another VM already or has no claim
				1402	* to the memory.
				1403	*/
				1404	if (orig_from_mode & MM_MODE_INVALID) {
				1405	goto fail;
				1406	}
				1407
				1408	/*
				1409	* The sender must own the memory and have exclusive access to it in
				1410	* order to share it. Alternatively, it is giving memory back to the
				1411	* owning VM.
				1412	*/
				1413	if (orig_from_mode & MM_MODE_UNOWNED) {
				1414	int orig_to_mode;
				1415
				1416	if (share != HF_MEMORY_GIVE \|\|
				1417	!mm_vm_get_mode(&to->ptable, begin, end, &orig_to_mode) \|\|
				1418	orig_to_mode & MM_MODE_UNOWNED) {
				1419	goto fail;
				1420	}
				1421	} else if (orig_from_mode & MM_MODE_SHARED) {
				1422	goto fail;
				1423	}
				1424
				1425	pa_begin = pa_from_ipa(begin);
				1426	pa_end = pa_from_ipa(end);
				1427
				1428	/*
				1429	* First update the mapping for the sender so there is not overlap with
				1430	* the recipient.
				1431	*/
				1432	if (!mm_vm_identity_map(&from->ptable, pa_begin, pa_end, from_mode,
				1433	NULL, &local_page_pool)) {
				1434	goto fail;
				1435	}
				1436
				1437	/* Clear the memory so no VM or device can see the previous contents. */
				1438	if (!api_clear_memory(pa_begin, pa_end, &local_page_pool)) {
				1439	goto fail_return_to_sender;
				1440	}
				1441
				1442	/* Complete the transfer by mapping the memory into the recipient. */
				1443	if (!mm_vm_identity_map(&to->ptable, pa_begin, pa_end, to_mode, NULL,
				1444	&local_page_pool)) {
				1445	/* TODO: partial defrag of failed range. */
				1446	/* Recover any memory consumed in failed mapping. */
				1447	mm_vm_defrag(&from->ptable, &local_page_pool);
				1448	goto fail_return_to_sender;
				1449	}
				1450
				1451	ret = 0;
				1452	goto out;
				1453
				1454	fail_return_to_sender:
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	1455	CHECK(mm_vm_identity_map(&from->ptable, pa_begin, pa_end,
				1456	orig_from_mode, NULL, &local_page_pool));
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1457
				1458	fail:
				1459	ret = -1;
				1460
				1461	out:
				1462	sl_unlock(&from->lock);
				1463	sl_unlock(&to->lock);
				1464
				1465	mpool_fini(&local_page_pool);
				1466
				1467	return ret;
				1468	}
Jose Marinho	fc0b2b6	2019-06-06 11:18:45 +0100	[diff] [blame]	1469
				1470	/** Returns the version of the implemented SPCI specification. */
				1471	int32_t api_spci_version(void)
				1472	{
				1473	/*
				1474	* Ensure that both major and minor revision representation occupies at
				1475	* most 15 bits.
				1476	*/
				1477	static_assert(0x8000 > SPCI_VERSION_MAJOR,
				1478	"Major revision representation take more than 15 bits.");
				1479	static_assert(0x10000 > SPCI_VERSION_MINOR,
				1480	"Minor revision representation take more than 16 bits.");
				1481
				1482	return (SPCI_VERSION_MAJOR << SPCI_VERSION_MAJOR_OFFSET) \|
				1483	SPCI_VERSION_MINOR;
				1484	}