Blame - src/api.c - hafnium/hafnium.git - TrustedFirmware Git Browser

blob: 6f118a2ba08133119890d8c69fc0c91aac4e0ccd [file] [log] [blame]

Andrew Scull	1883487	2018-10-12 11:48:09 +0100	[diff] [blame]	1	/*
Andrew Walbran	692b325	2019-03-07 15:51:31 +0000	[diff] [blame]	2	* Copyright 2018 The Hafnium Authors.
Andrew Scull	1883487	2018-10-12 11:48:09 +0100	[diff] [blame]	3	*
				4	* Licensed under the Apache License, Version 2.0 (the "License");
				5	* you may not use this file except in compliance with the License.
				6	* You may obtain a copy of the License at
				7	*
				8	* https://www.apache.org/licenses/LICENSE-2.0
				9	*
				10	* Unless required by applicable law or agreed to in writing, software
				11	* distributed under the License is distributed on an "AS IS" BASIS,
				12	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
				13	* See the License for the specific language governing permissions and
				14	* limitations under the License.
				15	*/
				16
Andrew Scull	18c78fc	2018-08-20 12:57:41 +0100	[diff] [blame]	17	#include "hf/api.h"
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	18
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	19	#include "hf/arch/cpu.h"
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	20	#include "hf/arch/timer.h"
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	21
Andrew Scull	877ae4b	2019-07-02 12:52:33 +0100	[diff] [blame]	22	#include "hf/check.h"
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	23	#include "hf/dlog.h"
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	24	#include "hf/mm.h"
Andrew Walbran	c1ad4ce	2019-05-09 11:41:39 +0100	[diff] [blame]	25	#include "hf/plat/console.h"
Jose Marinho	40d55f3	2019-07-01 15:41:54 +0100	[diff] [blame]	26	#include "hf/spci_internal.h"
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	27	#include "hf/spinlock.h"
Andrew Scull	877ae4b	2019-07-02 12:52:33 +0100	[diff] [blame]	28	#include "hf/static_assert.h"
Andrew Scull	8d9e121	2019-04-05 13:52:55 +0100	[diff] [blame]	29	#include "hf/std.h"
Andrew Scull	18c78fc	2018-08-20 12:57:41 +0100	[diff] [blame]	30	#include "hf/vm.h"
				31
Andrew Scull	f35a5c9	2018-08-07 18:09:46 +0100	[diff] [blame]	32	#include "vmapi/hf/call.h"
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	33	#include "vmapi/hf/spci.h"
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	34
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	35	/*
				36	* To eliminate the risk of deadlocks, we define a partial order for the
				37	* acquisition of locks held concurrently by the same physical CPU. Our current
				38	* ordering requirements are as follows:
				39	*
Andrew Walbran	c1ad4ce	2019-05-09 11:41:39 +0100	[diff] [blame]	40	* vm::lock -> vcpu::lock -> mm_stage1_lock -> dlog sl
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	41	*
Andrew Scull	4caadaf	2019-07-03 13:13:47 +0100	[diff] [blame]	42	* Locks of the same kind require the lock of lowest address to be locked first,
				43	* see `sl_lock_both()`.
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	44	*/
				45
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	46	static_assert(HF_MAILBOX_SIZE == PAGE_SIZE,
Andrew Scull	13652af	2018-09-17 14:49:08 +0100	[diff] [blame]	47	"Currently, a page is mapped for the send and receive buffers so "
				48	"the maximum request is the size of a page.");
				49
Wedson Almeida Filho	9ed8da5	2018-12-17 16:09:11 +0000	[diff] [blame]	50	static struct mpool api_page_pool;
Wedson Almeida Filho	22d5eaa	2018-12-16 00:38:49 +0000	[diff] [blame]	51
				52	/**
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	53	* Initialises the API page pool by taking ownership of the contents of the
				54	* given page pool.
Wedson Almeida Filho	22d5eaa	2018-12-16 00:38:49 +0000	[diff] [blame]	55	*/
				56	void api_init(struct mpool *ppool)
				57	{
Wedson Almeida Filho	9ed8da5	2018-12-17 16:09:11 +0000	[diff] [blame]	58	mpool_init_from(&api_page_pool, ppool);
Wedson Almeida Filho	22d5eaa	2018-12-16 00:38:49 +0000	[diff] [blame]	59	}
				60
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	61	/**
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	62	* Switches the physical CPU back to the corresponding vcpu of the primary VM.
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	63	*
				64	* This triggers the scheduling logic to run. Run in the context of secondary VM
Andrew Walbran	f0c314d	2019-10-02 14:24:26 +0100	[diff] [blame]	65	* to cause SPCI_RUN to return and the primary VM to regain control of the CPU.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	66	*/
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	67	static struct vcpu api_switch_to_primary(struct vcpu current,
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	68	struct spci_value primary_ret,
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	69	enum vcpu_state secondary_state)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	70	{
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	71	struct vm *primary = vm_find(HF_PRIMARY_VM_ID);
Andrew Walbran	e1310df	2019-04-29 17:28:28 +0100	[diff] [blame]	72	struct vcpu *next = vm_get_vcpu(primary, cpu_index(current->cpu));
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	73
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	74	/*
				75	* If the secondary is blocked but has a timer running, sleep until the
				76	* timer fires rather than indefinitely.
				77	*/
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	78	switch (primary_ret.func) {
				79	case HF_SPCI_RUN_WAIT_FOR_INTERRUPT:
				80	case SPCI_MSG_WAIT_32: {
				81	if (arch_timer_enabled_current()) {
				82	uint64_t remaining_ns =
				83	arch_timer_remaining_ns_current();
				84
				85	if (remaining_ns == 0) {
				86	/*
				87	* Timer is pending, so the current vCPU should
				88	* be run again right away.
				89	*/
				90	primary_ret.func = SPCI_INTERRUPT_32;
				91	/*
				92	* primary_ret.arg1 should already be set to the
				93	* current VM ID and vCPU ID.
				94	*/
				95	primary_ret.arg2 = 0;
				96	} else {
				97	primary_ret.arg2 = remaining_ns;
				98	}
				99	} else {
				100	primary_ret.arg2 = SPCI_SLEEP_INDEFINITE;
				101	}
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	102	break;
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	103	}
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	104
				105	default:
				106	/* Do nothing. */
				107	break;
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	108	}
				109
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	110	/* Set the return value for the primary VM's call to HF_VCPU_RUN. */
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	111	arch_regs_set_retval(&next->regs, primary_ret);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	112
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	113	/* Mark the current vcpu as waiting. */
				114	sl_lock(&current->lock);
				115	current->state = secondary_state;
				116	sl_unlock(&current->lock);
				117
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	118	return next;
				119	}
				120
				121	/**
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	122	* Returns to the primary vm and signals that the vcpu still has work to do so.
				123	*/
				124	struct vcpu api_preempt(struct vcpu current)
				125	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	126	struct spci_value ret = {
				127	.func = SPCI_INTERRUPT_32,
				128	.arg1 = ((uint32_t)current->vm->id << 16) \| vcpu_index(current),
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	129	};
				130
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	131	return api_switch_to_primary(current, ret, VCPU_STATE_READY);
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	132	}
				133
				134	/**
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	135	* Puts the current vcpu in wait for interrupt mode, and returns to the primary
				136	* vm.
				137	*/
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	138	struct vcpu api_wait_for_interrupt(struct vcpu current)
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	139	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	140	struct spci_value ret = {
				141	.func = HF_SPCI_RUN_WAIT_FOR_INTERRUPT,
				142	.arg1 = ((uint32_t)vcpu_index(current) << 16) \| current->vm->id,
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	143	};
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	144
Wedson Almeida Filho	ba641ef	2018-12-03 04:19:44 +0000	[diff] [blame]	145	return api_switch_to_primary(current, ret,
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	146	VCPU_STATE_BLOCKED_INTERRUPT);
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	147	}
				148
				149	/**
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	150	* Puts the current vCPU in off mode, and returns to the primary VM.
				151	*/
				152	struct vcpu api_vcpu_off(struct vcpu current)
				153	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	154	struct spci_value ret = {
				155	.func = HF_SPCI_RUN_WAIT_FOR_INTERRUPT,
				156	.arg1 = ((uint32_t)vcpu_index(current) << 16) \| current->vm->id,
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	157	};
				158
				159	/*
				160	* Disable the timer, so the scheduler doesn't get told to call back
				161	* based on it.
				162	*/
				163	arch_timer_disable_current();
				164
				165	return api_switch_to_primary(current, ret, VCPU_STATE_OFF);
				166	}
				167
				168	/**
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	169	* Returns to the primary vm to allow this cpu to be used for other tasks as the
				170	* vcpu does not have work to do at this moment. The current vcpu is marked as
Andrew Walbran	16075b6	2019-09-03 17:11:07 +0100	[diff] [blame]	171	* ready to be scheduled again.
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	172	*/
Andrew Walbran	16075b6	2019-09-03 17:11:07 +0100	[diff] [blame]	173	void api_yield(struct vcpu current, struct vcpu *next)
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	174	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	175	struct spci_value primary_ret = {
				176	.func = SPCI_YIELD_32,
				177	.arg1 = ((uint32_t)vcpu_index(current) << 16) \| current->vm->id,
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	178	};
				179
				180	if (current->vm->id == HF_PRIMARY_VM_ID) {
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	181	/* Noop on the primary as it makes the scheduling decisions. */
Andrew Walbran	16075b6	2019-09-03 17:11:07 +0100	[diff] [blame]	182	return;
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	183	}
				184
Andrew Walbran	16075b6	2019-09-03 17:11:07 +0100	[diff] [blame]	185	*next = api_switch_to_primary(current, primary_ret, VCPU_STATE_READY);
Andrew Scull	66d62bf	2019-02-01 13:54:10 +0000	[diff] [blame]	186	}
				187
				188	/**
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	189	* Switches to the primary so that it can switch to the target, or kick it if it
				190	* is already running on a different physical CPU.
				191	*/
				192	struct vcpu api_wake_up(struct vcpu current, struct vcpu *target_vcpu)
				193	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	194	struct spci_value ret = {
				195	.func = HF_SPCI_RUN_WAKE_UP,
				196	.arg1 = ((uint32_t)vcpu_index(target_vcpu) << 16) \|
				197	target_vcpu->vm->id,
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	198	};
				199	return api_switch_to_primary(current, ret, VCPU_STATE_READY);
				200	}
				201
				202	/**
Andrew Scull	38772ab	2019-01-24 15:16:50 +0000	[diff] [blame]	203	* Aborts the vCPU and triggers its VM to abort fully.
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	204	*/
				205	struct vcpu api_abort(struct vcpu current)
				206	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	207	struct spci_value ret = spci_error(SPCI_ABORTED);
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	208
				209	dlog("Aborting VM %u vCPU %u\n", current->vm->id, vcpu_index(current));
				210
				211	if (current->vm->id == HF_PRIMARY_VM_ID) {
				212	/* TODO: what to do when the primary aborts? */
				213	for (;;) {
				214	/* Do nothing. */
				215	}
				216	}
				217
				218	atomic_store_explicit(&current->vm->aborting, true,
				219	memory_order_relaxed);
				220
				221	/* TODO: free resources once all vCPUs abort. */
				222
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	223	return api_switch_to_primary(current, ret, VCPU_STATE_ABORTED);
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	224	}
				225
				226	/**
Andrew Scull	55c4d8b	2018-12-18 18:50:18 +0000	[diff] [blame]	227	* Returns the ID of the VM.
				228	*/
Andrew Walbran	d230f66	2019-10-07 18:03:36 +0100	[diff] [blame]	229	struct spci_value api_spci_id_get(const struct vcpu *current)
Andrew Scull	55c4d8b	2018-12-18 18:50:18 +0000	[diff] [blame]	230	{
Andrew Walbran	d230f66	2019-10-07 18:03:36 +0100	[diff] [blame]	231	return (struct spci_value){.func = SPCI_SUCCESS_32,
				232	.arg2 = current->vm->id};
Andrew Scull	55c4d8b	2018-12-18 18:50:18 +0000	[diff] [blame]	233	}
				234
				235	/**
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	236	* Returns the number of VMs configured to run.
				237	*/
Andrew Walbran	52d9967	2019-06-25 15:51:11 +0100	[diff] [blame]	238	spci_vm_count_t api_vm_get_count(void)
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	239	{
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	240	return vm_get_count();
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	241	}
				242
				243	/**
Andrew Walbran	c6d23c4	2019-06-26 13:30:42 +0100	[diff] [blame]	244	* Returns the number of vCPUs configured in the given VM, or 0 if there is no
				245	* such VM or the caller is not the primary VM.
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	246	*/
Andrew Walbran	c6d23c4	2019-06-26 13:30:42 +0100	[diff] [blame]	247	spci_vcpu_count_t api_vcpu_get_count(spci_vm_id_t vm_id,
				248	const struct vcpu *current)
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	249	{
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	250	struct vm *vm;
				251
				252	/* Only the primary VM needs to know about vcpus for scheduling. */
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	253	if (current->vm->id != HF_PRIMARY_VM_ID) {
Andrew Walbran	c6d23c4	2019-06-26 13:30:42 +0100	[diff] [blame]	254	return 0;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	255	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	256
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	257	vm = vm_find(vm_id);
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	258	if (vm == NULL) {
Andrew Walbran	c6d23c4	2019-06-26 13:30:42 +0100	[diff] [blame]	259	return 0;
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	260	}
				261
				262	return vm->vcpu_count;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	263	}
				264
				265	/**
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	266	* This function is called by the architecture-specific context switching
				267	* function to indicate that register state for the given vcpu has been saved
				268	* and can therefore be used by other pcpus.
				269	*/
				270	void api_regs_state_saved(struct vcpu *vcpu)
				271	{
				272	sl_lock(&vcpu->lock);
				273	vcpu->regs_available = true;
				274	sl_unlock(&vcpu->lock);
				275	}
				276
				277	/**
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	278	* Retrieves the next waiter and removes it from the wait list if the VM's
				279	* mailbox is in a writable state.
				280	*/
				281	static struct wait_entry *api_fetch_waiter(struct vm_locked locked_vm)
				282	{
				283	struct wait_entry *entry;
				284	struct vm *vm = locked_vm.vm;
				285
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	286	if (vm->mailbox.state != MAILBOX_STATE_EMPTY \|\|
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	287	vm->mailbox.recv == NULL \|\| list_empty(&vm->mailbox.waiter_list)) {
				288	/* The mailbox is not writable or there are no waiters. */
				289	return NULL;
				290	}
				291
				292	/* Remove waiter from the wait list. */
				293	entry = CONTAINER_OF(vm->mailbox.waiter_list.next, struct wait_entry,
				294	wait_links);
				295	list_remove(&entry->wait_links);
				296	return entry;
				297	}
				298
				299	/**
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	300	* Assuming that the arguments have already been checked by the caller, injects
				301	* a virtual interrupt of the given ID into the given target vCPU. This doesn't
				302	* cause the vCPU to actually be run immediately; it will be taken when the vCPU
				303	* is next run, which is up to the scheduler.
				304	*
				305	* Returns:
				306	* - 0 on success if no further action is needed.
				307	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				308	* up or kick the target vCPU.
				309	*/
Andrew Walbran	fc9d438	2019-05-10 18:07:21 +0100	[diff] [blame]	310	static int64_t internal_interrupt_inject(struct vcpu *target_vcpu,
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	311	uint32_t intid, struct vcpu *current,
				312	struct vcpu **next)
				313	{
				314	uint32_t intid_index = intid / INTERRUPT_REGISTER_BITS;
Andrew Walbran	e52006c	2019-10-22 18:01:28 +0100	[diff] [blame]	315	uint32_t intid_mask = 1U << (intid % INTERRUPT_REGISTER_BITS);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	316	int64_t ret = 0;
				317
				318	sl_lock(&target_vcpu->lock);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	319
				320	/*
				321	* We only need to change state and (maybe) trigger a virtual IRQ if it
				322	* is enabled and was not previously pending. Otherwise we can skip
				323	* everything except setting the pending bit.
				324	*
				325	* If you change this logic make sure to update the need_vm_lock logic
				326	* above to match.
				327	*/
				328	if (!(target_vcpu->interrupts.interrupt_enabled[intid_index] &
				329	~target_vcpu->interrupts.interrupt_pending[intid_index] &
				330	intid_mask)) {
				331	goto out;
				332	}
				333
				334	/* Increment the count. */
				335	target_vcpu->interrupts.enabled_and_pending_count++;
				336
				337	/*
				338	* Only need to update state if there was not already an
				339	* interrupt enabled and pending.
				340	*/
				341	if (target_vcpu->interrupts.enabled_and_pending_count != 1) {
				342	goto out;
				343	}
				344
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	345	if (current->vm->id == HF_PRIMARY_VM_ID) {
				346	/*
				347	* If the call came from the primary VM, let it know that it
				348	* should run or kick the target vCPU.
				349	*/
				350	ret = 1;
				351	} else if (current != target_vcpu && next != NULL) {
Andrew Walbran	3364565	2019-04-15 12:29:31 +0100	[diff] [blame]	352	*next = api_wake_up(current, target_vcpu);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	353	}
				354
				355	out:
				356	/* Either way, make it pending. */
				357	target_vcpu->interrupts.interrupt_pending[intid_index] \|= intid_mask;
				358
				359	sl_unlock(&target_vcpu->lock);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	360
				361	return ret;
				362	}
				363
				364	/**
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	365	* Constructs an SPCI_MSG_SEND value to return from a successful SPCI_MSG_POLL
				366	* or SPCI_MSG_WAIT call.
				367	*/
				368	static struct spci_value spci_msg_recv_return(const struct vm *receiver)
				369	{
				370	return (struct spci_value){
				371	.func = SPCI_MSG_SEND_32,
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	372	.arg1 = (receiver->mailbox.recv_sender << 16) \| receiver->id,
				373	.arg3 = receiver->mailbox.recv_size,
				374	.arg4 = receiver->mailbox.recv_attributes};
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	375	}
				376
				377	/**
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	378	* Prepares the vcpu to run by updating its state and fetching whether a return
				379	* value needs to be forced onto the vCPU.
				380	*/
Andrew Scull	38772ab	2019-01-24 15:16:50 +0000	[diff] [blame]	381	static bool api_vcpu_prepare_run(const struct vcpu current, struct vcpu vcpu,
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	382	struct spci_value *run_ret)
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	383	{
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	384	bool need_vm_lock;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	385	bool ret;
				386
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	387	/*
Andrew Scull	4caadaf	2019-07-03 13:13:47 +0100	[diff] [blame]	388	* Wait until the registers become available. All locks must be released
				389	* between iterations of this loop to avoid potential deadlocks if, on
				390	* any path, a lock needs to be taken after taking the decision to
				391	* switch context but before the registers have been saved.
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	392	*
Andrew Scull	4caadaf	2019-07-03 13:13:47 +0100	[diff] [blame]	393	* The VM lock is not needed in the common case so it must only be taken
				394	* when it is going to be needed. This ensures there are no inter-vCPU
				395	* dependencies in the common run case meaning the sensitive context
				396	* switch performance is consistent.
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	397	*/
				398	for (;;) {
				399	sl_lock(&vcpu->lock);
				400
				401	/* The VM needs to be locked to deliver mailbox messages. */
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	402	need_vm_lock = vcpu->state == VCPU_STATE_BLOCKED_MAILBOX;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	403	if (need_vm_lock) {
				404	sl_unlock(&vcpu->lock);
				405	sl_lock(&vcpu->vm->lock);
				406	sl_lock(&vcpu->lock);
				407	}
				408
				409	if (vcpu->regs_available) {
				410	break;
				411	}
				412
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	413	if (vcpu->state == VCPU_STATE_RUNNING) {
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	414	/*
				415	* vCPU is running on another pCPU.
				416	*
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	417	* It's okay not to return the sleep duration here
				418	* because the other physical CPU that is currently
				419	* running this vCPU will return the sleep duration if
				420	* needed.
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	421	*/
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	422	*run_ret = spci_error(SPCI_BUSY);
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	423	ret = false;
				424	goto out;
				425	}
				426
				427	sl_unlock(&vcpu->lock);
				428	if (need_vm_lock) {
				429	sl_unlock(&vcpu->vm->lock);
				430	}
				431	}
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	432
				433	if (atomic_load_explicit(&vcpu->vm->aborting, memory_order_relaxed)) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	434	if (vcpu->state != VCPU_STATE_ABORTED) {
Andrew Scull	8233128	2019-01-25 10:29:34 +0000	[diff] [blame]	435	dlog("Aborting VM %u vCPU %u\n", vcpu->vm->id,
				436	vcpu_index(vcpu));
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	437	vcpu->state = VCPU_STATE_ABORTED;
Andrew Scull	9726c25	2019-01-23 13:44:19 +0000	[diff] [blame]	438	}
				439	ret = false;
				440	goto out;
				441	}
				442
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	443	switch (vcpu->state) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	444	case VCPU_STATE_RUNNING:
				445	case VCPU_STATE_OFF:
				446	case VCPU_STATE_ABORTED:
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	447	ret = false;
				448	goto out;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	449
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	450	case VCPU_STATE_BLOCKED_MAILBOX:
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	451	/*
				452	* A pending message allows the vCPU to run so the message can
				453	* be delivered directly.
				454	*/
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	455	if (vcpu->vm->mailbox.state == MAILBOX_STATE_RECEIVED) {
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	456	arch_regs_set_retval(&vcpu->regs,
				457	spci_msg_recv_return(vcpu->vm));
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	458	vcpu->vm->mailbox.state = MAILBOX_STATE_READ;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	459	break;
				460	}
				461	/* Fall through. */
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	462	case VCPU_STATE_BLOCKED_INTERRUPT:
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	463	/* Allow virtual interrupts to be delivered. */
				464	if (vcpu->interrupts.enabled_and_pending_count > 0) {
				465	break;
				466	}
				467
				468	/* The timer expired so allow the interrupt to be delivered. */
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	469	if (arch_timer_pending(&vcpu->regs)) {
				470	break;
				471	}
				472
				473	/*
				474	* The vCPU is not ready to run, return the appropriate code to
				475	* the primary which called vcpu_run.
				476	*/
				477	if (arch_timer_enabled(&vcpu->regs)) {
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	478	run_ret->func =
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	479	vcpu->state == VCPU_STATE_BLOCKED_MAILBOX
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	480	? SPCI_MSG_WAIT_32
				481	: HF_SPCI_RUN_WAIT_FOR_INTERRUPT;
				482	run_ret->arg1 = ((uint32_t)vcpu_index(vcpu) << 16) \|
				483	vcpu->vm->id;
				484	/*
				485	* arch_timer_remaining_ns should never return 0,
				486	* because if it would then arch_timer_pending would
				487	* have returned true before and so we won't get here.
				488	*/
				489	run_ret->arg2 = arch_timer_remaining_ns(&vcpu->regs);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	490	}
				491
				492	ret = false;
				493	goto out;
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	494
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	495	case VCPU_STATE_READY:
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	496	break;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	497	}
				498
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	499	/* It has been decided that the vCPU should be run. */
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	500	vcpu->cpu = current->cpu;
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	501	vcpu->state = VCPU_STATE_RUNNING;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	502
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	503	/*
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	504	* Mark the registers as unavailable now that we're about to reflect
				505	* them onto the real registers. This will also prevent another physical
				506	* CPU from trying to read these registers.
				507	*/
				508	vcpu->regs_available = false;
				509
				510	ret = true;
				511
				512	out:
				513	sl_unlock(&vcpu->lock);
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	514	if (need_vm_lock) {
				515	sl_unlock(&vcpu->vm->lock);
				516	}
				517
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	518	return ret;
				519	}
				520
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	521	struct spci_value api_spci_run(spci_vm_id_t vm_id, spci_vcpu_index_t vcpu_idx,
				522	const struct vcpu current, struct vcpu *next)
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	523	{
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	524	struct vm *vm;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	525	struct vcpu *vcpu;
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	526	struct spci_value ret = spci_error(SPCI_INVALID_PARAMETERS);
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	527
				528	/* Only the primary VM can switch vcpus. */
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	529	if (current->vm->id != HF_PRIMARY_VM_ID) {
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	530	ret.arg2 = SPCI_DENIED;
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	531	goto out;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	532	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	533
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	534	/* Only secondary VM vcpus can be run. */
				535	if (vm_id == HF_PRIMARY_VM_ID) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	536	goto out;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	537	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	538
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	539	/* The requested VM must exist. */
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	540	vm = vm_find(vm_id);
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	541	if (vm == NULL) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	542	goto out;
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	543	}
				544
				545	/* The requested vcpu must exist. */
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	546	if (vcpu_idx >= vm->vcpu_count) {
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	547	goto out;
Andrew Scull	7364a8e	2018-07-19 15:39:29 +0100	[diff] [blame]	548	}
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	549
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	550	/* Update state if allowed. */
Andrew Walbran	e1310df	2019-04-29 17:28:28 +0100	[diff] [blame]	551	vcpu = vm_get_vcpu(vm, vcpu_idx);
Andrew Scull	b06d175	2019-02-04 10:15:48 +0000	[diff] [blame]	552	if (!api_vcpu_prepare_run(current, vcpu, &ret)) {
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	553	goto out;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	554	}
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	555
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	556	/*
				557	* Inject timer interrupt if timer has expired. It's safe to access
				558	* vcpu->regs here because api_vcpu_prepare_run already made sure that
				559	* regs_available was true (and then set it to false) before returning
				560	* true.
				561	*/
				562	if (arch_timer_pending(&vcpu->regs)) {
				563	/* Make virtual timer interrupt pending. */
Andrew Walbran	fc9d438	2019-05-10 18:07:21 +0100	[diff] [blame]	564	internal_interrupt_inject(vcpu, HF_VIRTUAL_TIMER_INTID, vcpu,
				565	NULL);
Andrew Walbran	508e63c	2018-12-20 17:02:37 +0000	[diff] [blame]	566
				567	/*
				568	* Set the mask bit so the hardware interrupt doesn't fire
				569	* again. Ideally we wouldn't do this because it affects what
				570	* the secondary vCPU sees, but if we don't then we end up with
				571	* a loop of the interrupt firing each time we try to return to
				572	* the secondary vCPU.
				573	*/
				574	arch_timer_mask(&vcpu->regs);
				575	}
				576
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	577	/* Switch to the vcpu. */
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	578	*next = vcpu;
Wedson Almeida Filho	0330611	2018-11-26 00:08:03 +0000	[diff] [blame]	579
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	580	/*
				581	* Set a placeholder return code to the scheduler. This will be
				582	* overwritten when the switch back to the primary occurs.
				583	*/
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	584	ret.func = SPCI_INTERRUPT_32;
				585	ret.arg1 = ((uint32_t)vm_id << 16) \| vcpu_idx;
				586	ret.arg2 = 0;
Andrew Scull	33fecd3	2019-01-08 14:48:27 +0000	[diff] [blame]	587
Andrew Scull	6d2db33	2018-10-10 15:28:17 +0100	[diff] [blame]	588	out:
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	589	return ret;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	590	}
				591
				592	/**
Andrew Scull	81e8509	2018-12-12 12:56:20 +0000	[diff] [blame]	593	* Check that the mode indicates memory that is valid, owned and exclusive.
				594	*/
Andrew Walbran	1281ed4	2019-10-22 17:23:40 +0100	[diff] [blame]	595	static bool api_mode_valid_owned_and_exclusive(uint32_t mode)
Andrew Scull	81e8509	2018-12-12 12:56:20 +0000	[diff] [blame]	596	{
Andrew Scull	b5f49e0	2019-10-02 13:20:47 +0100	[diff] [blame]	597	return (mode & (MM_MODE_D \| MM_MODE_INVALID \| MM_MODE_UNOWNED \|
				598	MM_MODE_SHARED)) == 0;
Andrew Scull	81e8509	2018-12-12 12:56:20 +0000	[diff] [blame]	599	}
				600
				601	/**
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	602	* Determines the value to be returned by api_vm_configure and api_mailbox_clear
				603	* after they've succeeded. If a secondary VM is running and there are waiters,
				604	* it also switches back to the primary VM for it to wake waiters up.
				605	*/
				606	static int64_t api_waiter_result(struct vm_locked locked_vm,
				607	struct vcpu current, struct vcpu *next)
				608	{
				609	struct vm *vm = locked_vm.vm;
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	610	struct spci_value ret = {
				611	.func = SPCI_RX_RELEASE_32,
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	612	};
				613
				614	if (list_empty(&vm->mailbox.waiter_list)) {
				615	/* No waiters, nothing else to do. */
				616	return 0;
				617	}
				618
				619	if (vm->id == HF_PRIMARY_VM_ID) {
				620	/* The caller is the primary VM. Tell it to wake up waiters. */
				621	return 1;
				622	}
				623
				624	/*
				625	* Switch back to the primary VM, informing it that there are waiters
				626	* that need to be notified.
				627	*/
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	628	*next = api_switch_to_primary(current, ret, VCPU_STATE_READY);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	629
				630	return 0;
				631	}
				632
				633	/**
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	634	* Configures the hypervisor's stage-1 view of the send and receive pages. The
				635	* stage-1 page tables must be locked so memory cannot be taken by another core
				636	* which could result in this transaction being unable to roll back in the case
				637	* of an error.
				638	*/
				639	static bool api_vm_configure_stage1(struct vm_locked vm_locked,
				640	paddr_t pa_send_begin, paddr_t pa_send_end,
				641	paddr_t pa_recv_begin, paddr_t pa_recv_end,
				642	struct mpool *local_page_pool)
				643	{
				644	bool ret;
				645	struct mm_stage1_locked mm_stage1_locked = mm_lock_stage1();
				646
				647	/* Map the send page as read-only in the hypervisor address space. */
				648	vm_locked.vm->mailbox.send =
				649	mm_identity_map(mm_stage1_locked, pa_send_begin, pa_send_end,
				650	MM_MODE_R, local_page_pool);
				651	if (!vm_locked.vm->mailbox.send) {
				652	/* TODO: partial defrag of failed range. */
				653	/* Recover any memory consumed in failed mapping. */
				654	mm_defrag(mm_stage1_locked, local_page_pool);
				655	goto fail;
				656	}
				657
				658	/*
				659	* Map the receive page as writable in the hypervisor address space. On
				660	* failure, unmap the send page before returning.
				661	*/
				662	vm_locked.vm->mailbox.recv =
				663	mm_identity_map(mm_stage1_locked, pa_recv_begin, pa_recv_end,
				664	MM_MODE_W, local_page_pool);
				665	if (!vm_locked.vm->mailbox.recv) {
				666	/* TODO: partial defrag of failed range. */
				667	/* Recover any memory consumed in failed mapping. */
				668	mm_defrag(mm_stage1_locked, local_page_pool);
				669	goto fail_undo_send;
				670	}
				671
				672	ret = true;
				673	goto out;
				674
				675	/*
				676	* The following mappings will not require more memory than is available
				677	* in the local pool.
				678	*/
				679	fail_undo_send:
				680	vm_locked.vm->mailbox.send = NULL;
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	681	CHECK(mm_unmap(mm_stage1_locked, pa_send_begin, pa_send_end,
				682	local_page_pool));
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	683
				684	fail:
				685	ret = false;
				686
				687	out:
				688	mm_unlock_stage1(&mm_stage1_locked);
				689
				690	return ret;
				691	}
				692
				693	/**
				694	* Configures the send and receive pages in the VM stage-2 and hypervisor
				695	* stage-1 page tables. Locking of the page tables combined with a local memory
				696	* pool ensures there will always be enough memory to recover from any errors
				697	* that arise.
				698	*/
				699	static bool api_vm_configure_pages(struct vm_locked vm_locked,
				700	paddr_t pa_send_begin, paddr_t pa_send_end,
Andrew Walbran	1281ed4	2019-10-22 17:23:40 +0100	[diff] [blame]	701	uint32_t orig_send_mode,
				702	paddr_t pa_recv_begin, paddr_t pa_recv_end,
				703	uint32_t orig_recv_mode)
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	704	{
				705	bool ret;
				706	struct mpool local_page_pool;
				707
				708	/*
				709	* Create a local pool so any freed memory can't be used by another
				710	* thread. This is to ensure the original mapping can be restored if any
				711	* stage of the process fails.
				712	*/
				713	mpool_init_with_fallback(&local_page_pool, &api_page_pool);
				714
				715	/* Take memory ownership away from the VM and mark as shared. */
				716	if (!mm_vm_identity_map(
				717	&vm_locked.vm->ptable, pa_send_begin, pa_send_end,
				718	MM_MODE_UNOWNED \| MM_MODE_SHARED \| MM_MODE_R \| MM_MODE_W,
				719	NULL, &local_page_pool)) {
				720	goto fail;
				721	}
				722
				723	if (!mm_vm_identity_map(&vm_locked.vm->ptable, pa_recv_begin,
				724	pa_recv_end,
				725	MM_MODE_UNOWNED \| MM_MODE_SHARED \| MM_MODE_R,
				726	NULL, &local_page_pool)) {
				727	/* TODO: partial defrag of failed range. */
				728	/* Recover any memory consumed in failed mapping. */
				729	mm_vm_defrag(&vm_locked.vm->ptable, &local_page_pool);
				730	goto fail_undo_send;
				731	}
				732
				733	if (!api_vm_configure_stage1(vm_locked, pa_send_begin, pa_send_end,
				734	pa_recv_begin, pa_recv_end,
				735	&local_page_pool)) {
				736	goto fail_undo_send_and_recv;
				737	}
				738
				739	ret = true;
				740	goto out;
				741
				742	/*
				743	* The following mappings will not require more memory than is available
				744	* in the local pool.
				745	*/
				746	fail_undo_send_and_recv:
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	747	CHECK(mm_vm_identity_map(&vm_locked.vm->ptable, pa_recv_begin,
				748	pa_recv_end, orig_recv_mode, NULL,
				749	&local_page_pool));
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	750
				751	fail_undo_send:
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	752	CHECK(mm_vm_identity_map(&vm_locked.vm->ptable, pa_send_begin,
				753	pa_send_end, orig_send_mode, NULL,
				754	&local_page_pool));
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	755
				756	fail:
				757	ret = false;
				758
				759	out:
				760	mpool_fini(&local_page_pool);
				761
				762	return ret;
				763	}
				764
				765	/**
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	766	* Configures the VM to send/receive data through the specified pages. The pages
				767	* must not be shared.
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	768	*
				769	* Returns:
				770	* - -1 on failure.
				771	* - 0 on success if no further action is needed.
				772	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				773	* up or kick waiters. Waiters should be retrieved by calling
				774	* hf_mailbox_waiter_get.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	775	*/
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	776	int64_t api_vm_configure(ipaddr_t send, ipaddr_t recv, struct vcpu *current,
				777	struct vcpu **next)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	778	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	779	struct vm *vm = current->vm;
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	780	struct vm_locked vm_locked;
Andrew Scull	8087132	2018-08-06 12:04:09 +0100	[diff] [blame]	781	paddr_t pa_send_begin;
				782	paddr_t pa_send_end;
				783	paddr_t pa_recv_begin;
				784	paddr_t pa_recv_end;
Andrew Walbran	1281ed4	2019-10-22 17:23:40 +0100	[diff] [blame]	785	uint32_t orig_send_mode;
				786	uint32_t orig_recv_mode;
Andrew Scull	c0e569a	2018-10-02 18:05:21 +0100	[diff] [blame]	787	int64_t ret;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	788
				789	/* Fail if addresses are not page-aligned. */
Alfredo Mazzinghi	eb1997c	2019-02-07 18:00:01 +0000	[diff] [blame]	790	if (!is_aligned(ipa_addr(send), PAGE_SIZE) \|\|
				791	!is_aligned(ipa_addr(recv), PAGE_SIZE)) {
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	792	return -1;
				793	}
				794
Andrew Scull	c2eb6a3	2018-12-13 16:54:24 +0000	[diff] [blame]	795	/* Convert to physical addresses. */
				796	pa_send_begin = pa_from_ipa(send);
				797	pa_send_end = pa_add(pa_send_begin, PAGE_SIZE);
				798
				799	pa_recv_begin = pa_from_ipa(recv);
				800	pa_recv_end = pa_add(pa_recv_begin, PAGE_SIZE);
				801
Andrew Scull	c9ccb3f	2018-08-13 15:27:12 +0100	[diff] [blame]	802	/* Fail if the same page is used for the send and receive pages. */
				803	if (pa_addr(pa_send_begin) == pa_addr(pa_recv_begin)) {
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	804	return -1;
				805	}
				806
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	807	/*
				808	* The hypervisor's memory map must be locked for the duration of this
				809	* operation to ensure there will be sufficient memory to recover from
				810	* any failures.
				811	*
				812	* TODO: the scope of the can be reduced but will require restructuring
				813	* to keep a single unlock point.
				814	*/
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	815	vm_locked = vm_lock(vm);
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	816
				817	/* We only allow these to be setup once. */
				818	if (vm->mailbox.send \|\| vm->mailbox.recv) {
				819	goto fail;
				820	}
				821
				822	/*
				823	* Ensure the pages are valid, owned and exclusive to the VM and that
				824	* the VM has the required access to the memory.
				825	*/
				826	if (!mm_vm_get_mode(&vm->ptable, send, ipa_add(send, PAGE_SIZE),
				827	&orig_send_mode) \|\|
				828	!api_mode_valid_owned_and_exclusive(orig_send_mode) \|\|
				829	(orig_send_mode & MM_MODE_R) == 0 \|\|
				830	(orig_send_mode & MM_MODE_W) == 0) {
				831	goto fail;
				832	}
				833
				834	if (!mm_vm_get_mode(&vm->ptable, recv, ipa_add(recv, PAGE_SIZE),
				835	&orig_recv_mode) \|\|
				836	!api_mode_valid_owned_and_exclusive(orig_recv_mode) \|\|
				837	(orig_recv_mode & MM_MODE_R) == 0) {
				838	goto fail;
				839	}
				840
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	841	if (!api_vm_configure_pages(vm_locked, pa_send_begin, pa_send_end,
				842	orig_send_mode, pa_recv_begin, pa_recv_end,
				843	orig_recv_mode)) {
				844	goto fail;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	845	}
				846
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	847	/* Tell caller about waiters, if any. */
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	848	ret = api_waiter_result(vm_locked, current, next);
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	849	goto exit;
				850
Andrew Scull	220e621	2018-12-21 18:09:00 +0000	[diff] [blame]	851	fail:
				852	ret = -1;
				853
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	854	exit:
Andrew Scull	e132279	2019-07-01 17:46:10 +0100	[diff] [blame]	855	vm_unlock(&vm_locked);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	856
				857	return ret;
				858	}
				859
				860	/**
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	861	* Checks whether the given `to` VM's mailbox is currently busy, and optionally
				862	* registers the `from` VM to be notified when it becomes available.
				863	*/
				864	static bool msg_receiver_busy(struct vm_locked to, struct vm_locked from,
				865	bool notify)
				866	{
				867	if (to.vm->mailbox.state != MAILBOX_STATE_EMPTY \|\|
				868	to.vm->mailbox.recv == NULL) {
				869	/*
				870	* Fail if the receiver isn't currently ready to receive data,
				871	* setting up for notification if requested.
				872	*/
				873	if (notify) {
				874	struct wait_entry *entry =
				875	&from.vm->wait_entries[to.vm->id];
				876
				877	/* Append waiter only if it's not there yet. */
				878	if (list_empty(&entry->wait_links)) {
				879	list_append(&to.vm->mailbox.waiter_list,
				880	&entry->wait_links);
				881	}
				882	}
				883
				884	return true;
				885	}
				886
				887	return false;
				888	}
				889
				890	/**
				891	* Notifies the `to` VM about the message currently in its mailbox, possibly
				892	* with the help of the primary VM.
				893	*/
				894	static void deliver_msg(struct vm_locked to, struct vm_locked from,
				895	uint32_t size, struct vcpu current, struct vcpu *next)
				896	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	897	struct spci_value primary_ret = {
				898	.func = SPCI_MSG_SEND_32,
				899	.arg1 = ((uint32_t)from.vm->id << 16) \| to.vm->id,
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	900	};
				901
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	902	/* Messages for the primary VM are delivered directly. */
				903	if (to.vm->id == HF_PRIMARY_VM_ID) {
				904	/*
				905	* Only tell the primary VM the size if the message is for it,
				906	* to avoid leaking data about messages for other VMs.
				907	*/
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	908	primary_ret.arg3 = size;
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	909
				910	to.vm->mailbox.state = MAILBOX_STATE_READ;
				911	*next = api_switch_to_primary(current, primary_ret,
				912	VCPU_STATE_READY);
				913	return;
				914	}
				915
				916	to.vm->mailbox.state = MAILBOX_STATE_RECEIVED;
				917
				918	/* Return to the primary VM directly or with a switch. */
				919	if (from.vm->id != HF_PRIMARY_VM_ID) {
				920	*next = api_switch_to_primary(current, primary_ret,
				921	VCPU_STATE_READY);
				922	}
				923	}
				924
				925	/**
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	926	* Copies data from the sender's send buffer to the recipient's receive buffer
				927	* and notifies the recipient.
Wedson Almeida Filho	17c997f	2019-01-09 18:50:09 +0000	[diff] [blame]	928	*
				929	* If the recipient's receive buffer is busy, it can optionally register the
				930	* caller to be notified when the recipient's receive buffer becomes available.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	931	*/
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	932	struct spci_value api_spci_msg_send(spci_vm_id_t sender_vm_id,
				933	spci_vm_id_t receiver_vm_id, uint32_t size,
				934	uint32_t attributes, struct vcpu *current,
				935	struct vcpu **next)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	936	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	937	struct vm *from = current->vm;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	938	struct vm *to;
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	939
Andrew Walbran	f659596	2019-10-15 16:47:56 +0100	[diff] [blame]	940	struct two_vm_locked vm_to_from_lock;
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	941
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	942	const void *from_msg;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	943
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	944	struct spci_value ret;
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	945	bool notify = (attributes & SPCI_MSG_SEND_NOTIFY_MASK) ==
				946	SPCI_MSG_SEND_NOTIFY;
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	947
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	948	/* Ensure sender VM ID corresponds to the current VM. */
				949	if (sender_vm_id != from->id) {
				950	return spci_error(SPCI_INVALID_PARAMETERS);
				951	}
				952
				953	/* Disallow reflexive requests as this suggests an error in the VM. */
				954	if (receiver_vm_id == from->id) {
				955	return spci_error(SPCI_INVALID_PARAMETERS);
				956	}
				957
				958	/* Limit the size of transfer. */
				959	if (size > SPCI_MSG_PAYLOAD_MAX) {
				960	return spci_error(SPCI_INVALID_PARAMETERS);
				961	}
				962
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	963	/*
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	964	* Check that the sender has configured its send buffer. If the tx
				965	* mailbox at from_msg is configured (i.e. from_msg != NULL) then it can
				966	* be safely accessed after releasing the lock since the tx mailbox
				967	* address can only be configured once.
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	968	*/
				969	sl_lock(&from->lock);
				970	from_msg = from->mailbox.send;
				971	sl_unlock(&from->lock);
				972
				973	if (from_msg == NULL) {
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	974	return spci_error(SPCI_INVALID_PARAMETERS);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	975	}
				976
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	977	/* Ensure the receiver VM exists. */
				978	to = vm_find(receiver_vm_id);
Jose Marinho	a1dfeda	2019-02-27 16:46:03 +0000	[diff] [blame]	979	if (to == NULL) {
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	980	return spci_error(SPCI_INVALID_PARAMETERS);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	981	}
				982
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	983	/*
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	984	* Hafnium needs to hold the lock on <to> before the mailbox state is
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	985	* checked. The lock on <to> must be held until the information is
				986	* copied to <to> Rx buffer. Since in
				987	* spci_msg_handle_architected_message we may call api_spci_share_memory
				988	* which must hold the <from> lock, we must hold the <from> lock at this
				989	* point to prevent a deadlock scenario.
				990	*/
Andrew Walbran	f659596	2019-10-15 16:47:56 +0100	[diff] [blame]	991	vm_to_from_lock = vm_lock_both(to, from);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	992
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	993	if (msg_receiver_busy(vm_to_from_lock.vm1, vm_to_from_lock.vm2,
				994	notify)) {
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	995	ret = spci_error(SPCI_BUSY);
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	996	goto out;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	997	}
				998
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	999	/* Handle legacy memory sharing messages. */
				1000	if ((attributes & SPCI_MSG_SEND_LEGACY_MEMORY_MASK) ==
				1001	SPCI_MSG_SEND_LEGACY_MEMORY) {
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1002	/*
				1003	* Buffer holding the internal copy of the shared memory
				1004	* regions.
				1005	*/
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1006	struct spci_architected_message_header
				1007	*architected_message_replica =
				1008	(struct spci_architected_message_header *)
				1009	cpu_get_buffer(current->cpu->id);
Jose Marinho	20713fa	2019-08-07 15:42:07 +0100	[diff] [blame]	1010	uint32_t message_buffer_size =
				1011	cpu_get_buffer_size(current->cpu->id);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1012
				1013	struct spci_architected_message_header *architected_header =
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1014	(struct spci_architected_message_header *)from_msg;
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1015
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1016	if (size > message_buffer_size) {
				1017	ret = spci_error(SPCI_INVALID_PARAMETERS);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1018	goto out;
				1019	}
				1020
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1021	if (size < sizeof(struct spci_architected_message_header)) {
				1022	ret = spci_error(SPCI_INVALID_PARAMETERS);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1023	goto out;
				1024	}
				1025
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1026	/* Copy the architected message into the internal buffer. */
				1027	memcpy_s(architected_message_replica, message_buffer_size,
				1028	architected_header, size);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1029
				1030	/*
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1031	* Note that architected_message_replica is passed as the third
				1032	* parameter to spci_msg_handle_architected_message. The
				1033	* execution flow commencing at
				1034	* spci_msg_handle_architected_message will make several
				1035	* accesses to fields in architected_message_replica. The memory
				1036	* area architected_message_replica must be exclusively owned by
				1037	* Hafnium so that TOCTOU issues do not arise.
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1038	*/
				1039	ret = spci_msg_handle_architected_message(
Andrew Walbran	f659596	2019-10-15 16:47:56 +0100	[diff] [blame]	1040	vm_to_from_lock.vm1, vm_to_from_lock.vm2,
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1041	architected_message_replica, size);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1042
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1043	if (ret.func != SPCI_SUCCESS_32) {
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1044	goto out;
				1045	}
				1046	} else {
				1047	/* Copy data. */
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1048	memcpy_s(to->mailbox.recv, SPCI_MSG_PAYLOAD_MAX, from_msg,
				1049	size);
				1050	to->mailbox.recv_size = size;
				1051	to->mailbox.recv_sender = sender_vm_id;
				1052	to->mailbox.recv_attributes = 0;
				1053	ret = (struct spci_value){.func = SPCI_SUCCESS_32};
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1054	}
				1055
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	1056	deliver_msg(vm_to_from_lock.vm1, vm_to_from_lock.vm2, size, current,
				1057	next);
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1058
				1059	out:
Andrew Walbran	f659596	2019-10-15 16:47:56 +0100	[diff] [blame]	1060	vm_unlock(&vm_to_from_lock.vm1);
				1061	vm_unlock(&vm_to_from_lock.vm2);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1062
Wedson Almeida Filho	80eb4a3	2018-11-30 17:11:15 +0000	[diff] [blame]	1063	return ret;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1064	}
				1065
				1066	/**
Andrew Scull	ec52ddf	2019-08-20 10:41:01 +0100	[diff] [blame]	1067	* Checks whether the vCPU's attempt to block for a message has already been
				1068	* interrupted or whether it is allowed to block.
				1069	*/
				1070	bool api_spci_msg_recv_block_interrupted(struct vcpu *current)
				1071	{
				1072	bool interrupted;
				1073
				1074	sl_lock(&current->lock);
				1075
				1076	/*
				1077	* Don't block if there are enabled and pending interrupts, to match
				1078	* behaviour of wait_for_interrupt.
				1079	*/
				1080	interrupted = (current->interrupts.enabled_and_pending_count > 0);
				1081
				1082	sl_unlock(&current->lock);
				1083
				1084	return interrupted;
				1085	}
				1086
				1087	/**
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1088	* Receives a message from the mailbox. If one isn't available, this function
				1089	* can optionally block the caller until one becomes available.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1090	*
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1091	* No new messages can be received until the mailbox has been cleared.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1092	*/
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	1093	struct spci_value api_spci_msg_recv(bool block, struct vcpu *current,
				1094	struct vcpu **next)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1095	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	1096	struct vm *vm = current->vm;
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	1097	struct spci_value return_code;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1098
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1099	/*
				1100	* The primary VM will receive messages as a status code from running
				1101	* vcpus and must not call this function.
				1102	*/
Andrew Scull	1950326	2018-09-20 14:48:39 +0100	[diff] [blame]	1103	if (vm->id == HF_PRIMARY_VM_ID) {
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	1104	return spci_error(SPCI_NOT_SUPPORTED);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1105	}
				1106
				1107	sl_lock(&vm->lock);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1108
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1109	/* Return pending messages without blocking. */
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1110	if (vm->mailbox.state == MAILBOX_STATE_RECEIVED) {
				1111	vm->mailbox.state = MAILBOX_STATE_READ;
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	1112	return_code = spci_msg_recv_return(vm);
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	1113	goto out;
				1114	}
				1115
				1116	/* No pending message so fail if not allowed to block. */
				1117	if (!block) {
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	1118	return_code = spci_error(SPCI_RETRY);
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1119	goto out;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1120	}
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1121
Andrew Walbran	9311c9a	2019-03-12 16:59:04 +0000	[diff] [blame]	1122	/*
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	1123	* From this point onward this call can only be interrupted or a message
				1124	* received. If a message is received the return value will be set at
				1125	* that time to SPCI_SUCCESS.
Andrew Walbran	9311c9a	2019-03-12 16:59:04 +0000	[diff] [blame]	1126	*/
Andrew Walbran	d4d2fa1	2019-10-01 16:47:25 +0100	[diff] [blame]	1127	return_code = spci_error(SPCI_INTERRUPTED);
Andrew Scull	ec52ddf	2019-08-20 10:41:01 +0100	[diff] [blame]	1128	if (api_spci_msg_recv_block_interrupted(current)) {
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1129	goto out;
				1130	}
				1131
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1132	/* Switch back to primary vm to block. */
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1133	{
Andrew Walbran	7a1ea0b	2019-10-02 18:18:44 +0100	[diff] [blame]	1134	struct spci_value run_return = {
				1135	.func = SPCI_MSG_WAIT_32,
				1136	.arg1 = ((uint32_t)vcpu_index(current) << 16) \| vm->id,
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1137	};
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1138
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1139	*next = api_switch_to_primary(current, run_return,
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1140	VCPU_STATE_BLOCKED_MAILBOX);
Andrew Walbran	b481655	2018-12-05 17:35:42 +0000	[diff] [blame]	1141	}
Andrew Scull	aa039b3	2018-10-04 15:02:26 +0100	[diff] [blame]	1142	out:
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1143	sl_unlock(&vm->lock);
				1144
Jose Marinho	3e2442f	2019-03-12 13:30:37 +0000	[diff] [blame]	1145	return return_code;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1146	}
				1147
				1148	/**
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1149	* Retrieves the next VM whose mailbox became writable. For a VM to be notified
				1150	* by this function, the caller must have called api_mailbox_send before with
				1151	* the notify argument set to true, and this call must have failed because the
				1152	* mailbox was not available.
				1153	*
				1154	* It should be called repeatedly to retrieve a list of VMs.
				1155	*
				1156	* Returns -1 if no VM became writable, or the id of the VM whose mailbox
				1157	* became writable.
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1158	*/
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1159	int64_t api_mailbox_writable_get(const struct vcpu *current)
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1160	{
Wedson Almeida Filho	00df6c7	2018-10-18 11:19:24 +0100	[diff] [blame]	1161	struct vm *vm = current->vm;
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1162	struct wait_entry *entry;
Andrew Scull	c0e569a	2018-10-02 18:05:21 +0100	[diff] [blame]	1163	int64_t ret;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1164
				1165	sl_lock(&vm->lock);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1166	if (list_empty(&vm->mailbox.ready_list)) {
				1167	ret = -1;
				1168	goto exit;
				1169	}
				1170
				1171	entry = CONTAINER_OF(vm->mailbox.ready_list.next, struct wait_entry,
				1172	ready_links);
				1173	list_remove(&entry->ready_links);
Wedson Almeida Filho	b790f65	2019-01-22 23:41:56 +0000	[diff] [blame]	1174	ret = entry - vm->wait_entries;
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1175
				1176	exit:
				1177	sl_unlock(&vm->lock);
				1178	return ret;
				1179	}
				1180
				1181	/**
				1182	* Retrieves the next VM waiting to be notified that the mailbox of the
				1183	* specified VM became writable. Only primary VMs are allowed to call this.
				1184	*
Wedson Almeida Filho	b790f65	2019-01-22 23:41:56 +0000	[diff] [blame]	1185	* Returns -1 on failure or if there are no waiters; the VM id of the next
				1186	* waiter otherwise.
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1187	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1188	int64_t api_mailbox_waiter_get(spci_vm_id_t vm_id, const struct vcpu *current)
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1189	{
				1190	struct vm *vm;
				1191	struct vm_locked locked;
				1192	struct wait_entry *entry;
				1193	struct vm *waiting_vm;
				1194
				1195	/* Only primary VMs are allowed to call this function. */
				1196	if (current->vm->id != HF_PRIMARY_VM_ID) {
				1197	return -1;
				1198	}
				1199
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1200	vm = vm_find(vm_id);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1201	if (vm == NULL) {
				1202	return -1;
				1203	}
				1204
				1205	/* Check if there are outstanding notifications from given vm. */
Andrew Walbran	7e932bd	2019-04-29 16:47:06 +0100	[diff] [blame]	1206	locked = vm_lock(vm);
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1207	entry = api_fetch_waiter(locked);
				1208	vm_unlock(&locked);
				1209
				1210	if (entry == NULL) {
				1211	return -1;
				1212	}
				1213
				1214	/* Enqueue notification to waiting VM. */
				1215	waiting_vm = entry->waiting_vm;
				1216
				1217	sl_lock(&waiting_vm->lock);
				1218	if (list_empty(&entry->ready_links)) {
				1219	list_append(&waiting_vm->mailbox.ready_list,
				1220	&entry->ready_links);
				1221	}
				1222	sl_unlock(&waiting_vm->lock);
				1223
				1224	return waiting_vm->id;
				1225	}
				1226
				1227	/**
				1228	* Clears the caller's mailbox so that a new message can be received. The caller
				1229	* must have copied out all data they wish to preserve as new messages will
				1230	* overwrite the old and will arrive asynchronously.
				1231	*
				1232	* Returns:
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1233	* - -1 on failure, if the mailbox hasn't been read.
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1234	* - 0 on success if no further action is needed.
				1235	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				1236	* up or kick waiters. Waiters should be retrieved by calling
				1237	* hf_mailbox_waiter_get.
				1238	*/
				1239	int64_t api_mailbox_clear(struct vcpu current, struct vcpu *next)
				1240	{
				1241	struct vm *vm = current->vm;
				1242	struct vm_locked locked;
				1243	int64_t ret;
				1244
Andrew Walbran	7e932bd	2019-04-29 16:47:06 +0100	[diff] [blame]	1245	locked = vm_lock(vm);
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1246	switch (vm->mailbox.state) {
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1247	case MAILBOX_STATE_EMPTY:
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1248	ret = 0;
				1249	break;
				1250
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1251	case MAILBOX_STATE_RECEIVED:
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1252	ret = -1;
				1253	break;
				1254
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1255	case MAILBOX_STATE_READ:
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1256	ret = api_waiter_result(locked, current, next);
Andrew Scull	d6ee110	2019-04-05 22:12:42 +0100	[diff] [blame]	1257	vm->mailbox.state = MAILBOX_STATE_EMPTY;
Andrew Scull	aa7db8e	2019-02-01 14:12:19 +0000	[diff] [blame]	1258	break;
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1259	}
Wedson Almeida Filho	ea62e2e	2019-01-09 19:14:59 +0000	[diff] [blame]	1260	vm_unlock(&locked);
Wedson Almeida Filho	2f94ec1	2018-07-26 16:00:48 +0100	[diff] [blame]	1261
				1262	return ret;
Wedson Almeida Filho	3fcbcff	2018-07-10 23:53:39 +0100	[diff] [blame]	1263	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1264
				1265	/**
				1266	* Enables or disables a given interrupt ID for the calling vCPU.
				1267	*
				1268	* Returns 0 on success, or -1 if the intid is invalid.
				1269	*/
Wedson Almeida Filho	c559d13	2019-01-09 19:33:40 +0000	[diff] [blame]	1270	int64_t api_interrupt_enable(uint32_t intid, bool enable, struct vcpu *current)
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1271	{
				1272	uint32_t intid_index = intid / INTERRUPT_REGISTER_BITS;
Andrew Walbran	e52006c	2019-10-22 18:01:28 +0100	[diff] [blame]	1273	uint32_t intid_mask = 1U << (intid % INTERRUPT_REGISTER_BITS);
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1274
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1275	if (intid >= HF_NUM_INTIDS) {
				1276	return -1;
				1277	}
				1278
				1279	sl_lock(&current->lock);
				1280	if (enable) {
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1281	/*
				1282	* If it is pending and was not enabled before, increment the
				1283	* count.
				1284	*/
				1285	if (current->interrupts.interrupt_pending[intid_index] &
				1286	~current->interrupts.interrupt_enabled[intid_index] &
				1287	intid_mask) {
				1288	current->interrupts.enabled_and_pending_count++;
				1289	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1290	current->interrupts.interrupt_enabled[intid_index] \|=
				1291	intid_mask;
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1292	} else {
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1293	/*
				1294	* If it is pending and was enabled before, decrement the count.
				1295	*/
				1296	if (current->interrupts.interrupt_pending[intid_index] &
				1297	current->interrupts.interrupt_enabled[intid_index] &
				1298	intid_mask) {
				1299	current->interrupts.enabled_and_pending_count--;
				1300	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1301	current->interrupts.interrupt_enabled[intid_index] &=
				1302	~intid_mask;
				1303	}
				1304
				1305	sl_unlock(&current->lock);
				1306	return 0;
				1307	}
				1308
				1309	/**
				1310	* Returns the ID of the next pending interrupt for the calling vCPU, and
				1311	* acknowledges it (i.e. marks it as no longer pending). Returns
				1312	* HF_INVALID_INTID if there are no pending interrupts.
				1313	*/
Wedson Almeida Filho	c559d13	2019-01-09 19:33:40 +0000	[diff] [blame]	1314	uint32_t api_interrupt_get(struct vcpu *current)
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1315	{
				1316	uint8_t i;
				1317	uint32_t first_interrupt = HF_INVALID_INTID;
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1318
				1319	/*
				1320	* Find the first enabled and pending interrupt ID, return it, and
				1321	* deactivate it.
				1322	*/
				1323	sl_lock(&current->lock);
				1324	for (i = 0; i < HF_NUM_INTIDS / INTERRUPT_REGISTER_BITS; ++i) {
				1325	uint32_t enabled_and_pending =
				1326	current->interrupts.interrupt_enabled[i] &
				1327	current->interrupts.interrupt_pending[i];
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1328
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1329	if (enabled_and_pending != 0) {
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1330	uint8_t bit_index = ctz(enabled_and_pending);
				1331	/*
				1332	* Mark it as no longer pending and decrement the count.
				1333	*/
				1334	current->interrupts.interrupt_pending[i] &=
Andrew Walbran	e52006c	2019-10-22 18:01:28 +0100	[diff] [blame]	1335	~(1U << bit_index);
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1336	current->interrupts.enabled_and_pending_count--;
				1337	first_interrupt =
				1338	i * INTERRUPT_REGISTER_BITS + bit_index;
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1339	break;
				1340	}
				1341	}
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1342
				1343	sl_unlock(&current->lock);
				1344	return first_interrupt;
				1345	}
				1346
				1347	/**
Andrew Walbran	4cf217a	2018-12-14 15:24:50 +0000	[diff] [blame]	1348	* Returns whether the current vCPU is allowed to inject an interrupt into the
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1349	* given VM and vCPU.
				1350	*/
				1351	static inline bool is_injection_allowed(uint32_t target_vm_id,
				1352	struct vcpu *current)
				1353	{
				1354	uint32_t current_vm_id = current->vm->id;
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1355
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1356	/*
				1357	* The primary VM is allowed to inject interrupts into any VM. Secondary
				1358	* VMs are only allowed to inject interrupts into their own vCPUs.
				1359	*/
				1360	return current_vm_id == HF_PRIMARY_VM_ID \|\|
				1361	current_vm_id == target_vm_id;
				1362	}
				1363
				1364	/**
				1365	* Injects a virtual interrupt of the given ID into the given target vCPU.
				1366	* This doesn't cause the vCPU to actually be run immediately; it will be taken
				1367	* when the vCPU is next run, which is up to the scheduler.
				1368	*
Andrew Walbran	3d84a26	2018-12-13 14:41:19 +0000	[diff] [blame]	1369	* Returns:
				1370	* - -1 on failure because the target VM or vCPU doesn't exist, the interrupt
				1371	* ID is invalid, or the current VM is not allowed to inject interrupts to
				1372	* the target VM.
				1373	* - 0 on success if no further action is needed.
				1374	* - 1 if it was called by the primary VM and the primary VM now needs to wake
				1375	* up or kick the target vCPU.
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1376	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1377	int64_t api_interrupt_inject(spci_vm_id_t target_vm_id,
Andrew Walbran	b037d5b	2019-06-25 17:19:41 +0100	[diff] [blame]	1378	spci_vcpu_index_t target_vcpu_idx, uint32_t intid,
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1379	struct vcpu current, struct vcpu *next)
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1380	{
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1381	struct vcpu *target_vcpu;
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1382	struct vm *target_vm = vm_find(target_vm_id);
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1383
				1384	if (intid >= HF_NUM_INTIDS) {
				1385	return -1;
				1386	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1387
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1388	if (target_vm == NULL) {
				1389	return -1;
				1390	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1391
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1392	if (target_vcpu_idx >= target_vm->vcpu_count) {
				1393	/* The requested vcpu must exist. */
				1394	return -1;
				1395	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1396
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1397	if (!is_injection_allowed(target_vm_id, current)) {
				1398	return -1;
				1399	}
Wedson Almeida Filho	81568c4	2019-01-04 13:33:02 +0000	[diff] [blame]	1400
Andrew Walbran	e1310df	2019-04-29 17:28:28 +0100	[diff] [blame]	1401	target_vcpu = vm_get_vcpu(target_vm, target_vcpu_idx);
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1402
				1403	dlog("Injecting IRQ %d for VM %d VCPU %d from VM %d VCPU %d\n", intid,
				1404	target_vm_id, target_vcpu_idx, current->vm->id, current->cpu->id);
Andrew Walbran	fc9d438	2019-05-10 18:07:21 +0100	[diff] [blame]	1405	return internal_interrupt_inject(target_vcpu, intid, current, next);
Andrew Walbran	318f573	2018-11-20 16:23:42 +0000	[diff] [blame]	1406	}
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1407
				1408	/**
				1409	* Clears a region of physical memory by overwriting it with zeros. The data is
				1410	* flushed from the cache so the memory has been cleared across the system.
				1411	*/
				1412	static bool api_clear_memory(paddr_t begin, paddr_t end, struct mpool *ppool)
				1413	{
				1414	/*
				1415	* TODO: change this to a cpu local single page window rather than a
				1416	* global mapping of the whole range. Such an approach will limit
				1417	* the changes to stage-1 tables and will allow only local
				1418	* invalidation.
				1419	*/
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1420	bool ret;
				1421	struct mm_stage1_locked stage1_locked = mm_lock_stage1();
				1422	void *ptr =
				1423	mm_identity_map(stage1_locked, begin, end, MM_MODE_W, ppool);
Andrew Walbran	2cb4339	2019-04-17 12:52:45 +0100	[diff] [blame]	1424	size_t size = pa_difference(begin, end);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1425
				1426	if (!ptr) {
				1427	/* TODO: partial defrag of failed range. */
				1428	/* Recover any memory consumed in failed mapping. */
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1429	mm_defrag(stage1_locked, ppool);
				1430	goto fail;
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1431	}
				1432
Andrew Scull	2b5fbad	2019-04-05 13:55:56 +0100	[diff] [blame]	1433	memset_s(ptr, size, 0, size);
Andrew Scull	c059fbe	2019-09-12 12:58:40 +0100	[diff] [blame]	1434	arch_mm_flush_dcache(ptr, size);
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1435	mm_unmap(stage1_locked, begin, end, ppool);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1436
Andrew Scull	3c0a90a	2019-07-01 11:55:53 +0100	[diff] [blame]	1437	ret = true;
				1438	goto out;
				1439
				1440	fail:
				1441	ret = false;
				1442
				1443	out:
				1444	mm_unlock_stage1(&stage1_locked);
				1445
				1446	return ret;
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1447	}
				1448
Andrew Walbran	e0f575f	2019-10-16 16:00:12 +0100	[diff] [blame]	1449	/** TODO: Move function to spci_architected_message.c. */
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1450	/**
				1451	* Shares memory from the calling VM with another. The memory can be shared in
				1452	* different modes.
				1453	*
				1454	* This function requires the calling context to hold the <to> and <from> locks.
				1455	*
				1456	* Returns:
				1457	* In case of error one of the following values is returned:
				1458	* 1) SPCI_INVALID_PARAMETERS - The endpoint provided parameters were
				1459	* erroneous;
Andrew Walbran	379aa72	2019-10-07 14:16:34 +0100	[diff] [blame]	1460	* 2) SPCI_NO_MEMORY - Hafnium did not have sufficient memory to complete
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1461	* the request.
				1462	* Success is indicated by SPCI_SUCCESS.
				1463	*/
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1464	struct spci_value api_spci_share_memory(
				1465	struct vm_locked to_locked, struct vm_locked from_locked,
				1466	struct spci_memory_region *memory_region, uint32_t memory_to_attributes,
				1467	enum spci_memory_share share)
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1468	{
				1469	struct vm *to = to_locked.vm;
				1470	struct vm *from = from_locked.vm;
Andrew Walbran	1281ed4	2019-10-22 17:23:40 +0100	[diff] [blame]	1471	uint32_t orig_from_mode;
				1472	uint32_t from_mode;
				1473	uint32_t to_mode;
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1474	struct mpool local_page_pool;
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1475	struct spci_value ret;
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1476	paddr_t pa_begin;
				1477	paddr_t pa_end;
				1478	ipaddr_t begin;
				1479	ipaddr_t end;
Andrew Walbran	f597218	2019-10-15 15:41:26 +0100	[diff] [blame]	1480	struct spci_memory_region_constituent *constituents =
				1481	spci_memory_region_get_constituents(memory_region);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1482
				1483	size_t size;
				1484
				1485	/* Disallow reflexive shares as this suggests an error in the VM. */
				1486	if (to == from) {
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1487	return spci_error(SPCI_INVALID_PARAMETERS);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1488	}
				1489
				1490	/*
				1491	* Create a local pool so any freed memory can't be used by another
				1492	* thread. This is to ensure the original mapping can be restored if any
				1493	* stage of the process fails.
				1494	*/
				1495	mpool_init_with_fallback(&local_page_pool, &api_page_pool);
				1496
				1497	/* Obtain the single contiguous set of pages from the memory_region. */
				1498	/* TODO: Add support for multiple constituent regions. */
Andrew Walbran	f597218	2019-10-15 15:41:26 +0100	[diff] [blame]	1499	size = constituents[0].page_count * PAGE_SIZE;
				1500	begin = ipa_init(constituents[0].address);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1501	end = ipa_add(begin, size);
				1502
				1503	/*
				1504	* Check if the state transition is lawful for both VMs involved
				1505	* in the memory exchange, ensure that all constituents of a memory
				1506	* region being shared are at the same state.
				1507	*/
				1508	if (!spci_msg_check_transition(to, from, share, &orig_from_mode, begin,
				1509	end, memory_to_attributes, &from_mode,
				1510	&to_mode)) {
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1511	return spci_error(SPCI_INVALID_PARAMETERS);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1512	}
				1513
				1514	pa_begin = pa_from_ipa(begin);
				1515	pa_end = pa_from_ipa(end);
				1516
				1517	/*
				1518	* First update the mapping for the sender so there is not overlap with
				1519	* the recipient.
				1520	*/
				1521	if (!mm_vm_identity_map(&from->ptable, pa_begin, pa_end, from_mode,
				1522	NULL, &local_page_pool)) {
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1523	ret = spci_error(SPCI_NO_MEMORY);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1524	goto out;
				1525	}
				1526
				1527	/* Complete the transfer by mapping the memory into the recipient. */
				1528	if (!mm_vm_identity_map(&to->ptable, pa_begin, pa_end, to_mode, NULL,
				1529	&local_page_pool)) {
				1530	/* TODO: partial defrag of failed range. */
				1531	/* Recover any memory consumed in failed mapping. */
				1532	mm_vm_defrag(&from->ptable, &local_page_pool);
				1533
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1534	ret = spci_error(SPCI_NO_MEMORY);
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1535
				1536	CHECK(mm_vm_identity_map(&from->ptable, pa_begin, pa_end,
				1537	orig_from_mode, NULL,
				1538	&local_page_pool));
				1539
				1540	goto out;
				1541	}
				1542
Andrew Walbran	70bc862	2019-10-07 14:15:58 +0100	[diff] [blame]	1543	ret = (struct spci_value){.func = SPCI_SUCCESS_32};
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1544
				1545	out:
Jose Marinho	75509b4	2019-04-09 09:34:59 +0100	[diff] [blame]	1546	mpool_fini(&local_page_pool);
				1547
				1548	return ret;
				1549	}
				1550
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1551	/**
				1552	* Shares memory from the calling VM with another. The memory can be shared in
				1553	* different modes.
				1554	*
				1555	* TODO: the interface for sharing memory will need to be enhanced to allow
				1556	* sharing with different modes e.g. read-only, informing the recipient
				1557	* of the memory they have been given, opting to not wipe the memory and
				1558	* possibly allowing multiple blocks to be transferred. What this will
				1559	* look like is TBD.
				1560	*/
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1561	int64_t api_share_memory(spci_vm_id_t vm_id, ipaddr_t addr, size_t size,
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1562	enum hf_share share, struct vcpu *current)
				1563	{
				1564	struct vm *from = current->vm;
				1565	struct vm *to;
Andrew Walbran	1281ed4	2019-10-22 17:23:40 +0100	[diff] [blame]	1566	uint32_t orig_from_mode;
				1567	uint32_t from_mode;
				1568	uint32_t to_mode;
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1569	ipaddr_t begin;
				1570	ipaddr_t end;
				1571	paddr_t pa_begin;
				1572	paddr_t pa_end;
				1573	struct mpool local_page_pool;
				1574	int64_t ret;
				1575
				1576	/* Disallow reflexive shares as this suggests an error in the VM. */
				1577	if (vm_id == from->id) {
				1578	return -1;
				1579	}
				1580
				1581	/* Ensure the target VM exists. */
Andrew Walbran	42347a9	2019-05-09 13:59:03 +0100	[diff] [blame]	1582	to = vm_find(vm_id);
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1583	if (to == NULL) {
				1584	return -1;
				1585	}
				1586
				1587	begin = addr;
				1588	end = ipa_add(addr, size);
				1589
				1590	/* Fail if addresses are not page-aligned. */
Alfredo Mazzinghi	eb1997c	2019-02-07 18:00:01 +0000	[diff] [blame]	1591	if (!is_aligned(ipa_addr(begin), PAGE_SIZE) \|\|
				1592	!is_aligned(ipa_addr(end), PAGE_SIZE)) {
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1593	return -1;
				1594	}
				1595
				1596	/* Convert the sharing request to memory management modes. */
				1597	switch (share) {
				1598	case HF_MEMORY_GIVE:
				1599	from_mode = MM_MODE_INVALID \| MM_MODE_UNOWNED;
				1600	to_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X;
				1601	break;
				1602
				1603	case HF_MEMORY_LEND:
				1604	from_mode = MM_MODE_INVALID;
				1605	to_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X \| MM_MODE_UNOWNED;
				1606	break;
				1607
				1608	case HF_MEMORY_SHARE:
				1609	from_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X \| MM_MODE_SHARED;
				1610	to_mode = MM_MODE_R \| MM_MODE_W \| MM_MODE_X \| MM_MODE_UNOWNED \|
				1611	MM_MODE_SHARED;
				1612	break;
				1613
				1614	default:
				1615	/* The input is untrusted so might not be a valid value. */
				1616	return -1;
				1617	}
				1618
				1619	/*
				1620	* Create a local pool so any freed memory can't be used by another
				1621	* thread. This is to ensure the original mapping can be restored if any
				1622	* stage of the process fails.
				1623	*/
				1624	mpool_init_with_fallback(&local_page_pool, &api_page_pool);
				1625
				1626	sl_lock_both(&from->lock, &to->lock);
				1627
				1628	/*
				1629	* Ensure that the memory range is mapped with the same mode so that
				1630	* changes can be reverted if the process fails.
				1631	*/
				1632	if (!mm_vm_get_mode(&from->ptable, begin, end, &orig_from_mode)) {
				1633	goto fail;
				1634	}
				1635
Andrew Scull	b5f49e0	2019-10-02 13:20:47 +0100	[diff] [blame]	1636	/* Ensure the address range is normal memory and not a device. */
				1637	if (orig_from_mode & MM_MODE_D) {
				1638	goto fail;
				1639	}
				1640
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1641	/*
				1642	* Ensure the memory range is valid for the sender. If it isn't, the
				1643	* sender has either shared it with another VM already or has no claim
				1644	* to the memory.
				1645	*/
				1646	if (orig_from_mode & MM_MODE_INVALID) {
				1647	goto fail;
				1648	}
				1649
				1650	/*
				1651	* The sender must own the memory and have exclusive access to it in
				1652	* order to share it. Alternatively, it is giving memory back to the
				1653	* owning VM.
				1654	*/
				1655	if (orig_from_mode & MM_MODE_UNOWNED) {
Andrew Walbran	1281ed4	2019-10-22 17:23:40 +0100	[diff] [blame]	1656	uint32_t orig_to_mode;
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1657
				1658	if (share != HF_MEMORY_GIVE \|\|
				1659	!mm_vm_get_mode(&to->ptable, begin, end, &orig_to_mode) \|\|
				1660	orig_to_mode & MM_MODE_UNOWNED) {
				1661	goto fail;
				1662	}
				1663	} else if (orig_from_mode & MM_MODE_SHARED) {
				1664	goto fail;
				1665	}
				1666
				1667	pa_begin = pa_from_ipa(begin);
				1668	pa_end = pa_from_ipa(end);
				1669
				1670	/*
				1671	* First update the mapping for the sender so there is not overlap with
				1672	* the recipient.
				1673	*/
				1674	if (!mm_vm_identity_map(&from->ptable, pa_begin, pa_end, from_mode,
				1675	NULL, &local_page_pool)) {
				1676	goto fail;
				1677	}
				1678
				1679	/* Clear the memory so no VM or device can see the previous contents. */
				1680	if (!api_clear_memory(pa_begin, pa_end, &local_page_pool)) {
				1681	goto fail_return_to_sender;
				1682	}
				1683
				1684	/* Complete the transfer by mapping the memory into the recipient. */
				1685	if (!mm_vm_identity_map(&to->ptable, pa_begin, pa_end, to_mode, NULL,
				1686	&local_page_pool)) {
				1687	/* TODO: partial defrag of failed range. */
				1688	/* Recover any memory consumed in failed mapping. */
				1689	mm_vm_defrag(&from->ptable, &local_page_pool);
				1690	goto fail_return_to_sender;
				1691	}
				1692
				1693	ret = 0;
				1694	goto out;
				1695
				1696	fail_return_to_sender:
Andrew Scull	7e8de32	2019-07-02 13:00:56 +0100	[diff] [blame]	1697	CHECK(mm_vm_identity_map(&from->ptable, pa_begin, pa_end,
				1698	orig_from_mode, NULL, &local_page_pool));
Andrew Scull	6386f25	2018-12-06 13:29:10 +0000	[diff] [blame]	1699
				1700	fail:
				1701	ret = -1;
				1702
				1703	out:
				1704	sl_unlock(&from->lock);
				1705	sl_unlock(&to->lock);
				1706
				1707	mpool_fini(&local_page_pool);
				1708
				1709	return ret;
				1710	}
Jose Marinho	fc0b2b6	2019-06-06 11:18:45 +0100	[diff] [blame]	1711
				1712	/** Returns the version of the implemented SPCI specification. */
Andrew Walbran	7f920af	2019-09-03 17:09:30 +0100	[diff] [blame]	1713	struct spci_value api_spci_version(void)
Jose Marinho	fc0b2b6	2019-06-06 11:18:45 +0100	[diff] [blame]	1714	{
				1715	/*
				1716	* Ensure that both major and minor revision representation occupies at
				1717	* most 15 bits.
				1718	*/
				1719	static_assert(0x8000 > SPCI_VERSION_MAJOR,
				1720	"Major revision representation take more than 15 bits.");
				1721	static_assert(0x10000 > SPCI_VERSION_MINOR,
				1722	"Minor revision representation take more than 16 bits.");
				1723
Andrew Walbran	7f920af	2019-09-03 17:09:30 +0100	[diff] [blame]	1724	struct spci_value ret = {
				1725	.func = SPCI_SUCCESS_32,
Andrew Walbran	455c53a	2019-10-10 13:56:19 +0100	[diff] [blame]	1726	.arg2 = (SPCI_VERSION_MAJOR << SPCI_VERSION_MAJOR_OFFSET) \|
Andrew Walbran	7f920af	2019-09-03 17:09:30 +0100	[diff] [blame]	1727	SPCI_VERSION_MINOR};
				1728	return ret;
Jose Marinho	fc0b2b6	2019-06-06 11:18:45 +0100	[diff] [blame]	1729	}
Andrew Walbran	c1ad4ce	2019-05-09 11:41:39 +0100	[diff] [blame]	1730
				1731	int64_t api_debug_log(char c, struct vcpu *current)
				1732	{
Andrew Scull	d54e1be	2019-08-20 11:09:42 +0100	[diff] [blame]	1733	bool flush;
Andrew Walbran	c1ad4ce	2019-05-09 11:41:39 +0100	[diff] [blame]	1734	struct vm *vm = current->vm;
				1735	struct vm_locked vm_locked = vm_lock(vm);
				1736
Andrew Scull	d54e1be	2019-08-20 11:09:42 +0100	[diff] [blame]	1737	if (c == '\n' \|\| c == '\0') {
				1738	flush = true;
				1739	} else {
				1740	vm->log_buffer[vm->log_buffer_length++] = c;
				1741	flush = (vm->log_buffer_length == sizeof(vm->log_buffer));
				1742	}
				1743
				1744	if (flush) {
Andrew Walbran	7f904bf	2019-07-12 16:38:38 +0100	[diff] [blame]	1745	dlog_flush_vm_buffer(vm->id, vm->log_buffer,
				1746	vm->log_buffer_length);
				1747	vm->log_buffer_length = 0;
Andrew Walbran	c1ad4ce	2019-05-09 11:41:39 +0100	[diff] [blame]	1748	}
				1749
				1750	vm_unlock(&vm_locked);
				1751
				1752	return 0;
				1753	}
Jose Marinho	c0f4ff2	2019-10-09 10:37:42 +0100	[diff] [blame]	1754
				1755	/**
				1756	* Discovery function returning information about the implementation of optional
				1757	* SPCI interfaces.
				1758	*/
				1759	struct spci_value api_spci_features(uint32_t function_id)
				1760	{
				1761	switch (function_id) {
				1762	case SPCI_ERROR_32:
				1763	case SPCI_SUCCESS_32:
				1764	case SPCI_ID_GET_32:
				1765	case SPCI_YIELD_32:
				1766	case SPCI_VERSION_32:
				1767	case SPCI_FEATURES_32:
				1768	case SPCI_MSG_SEND_32:
				1769	case SPCI_MSG_POLL_32:
				1770	case SPCI_MSG_WAIT_32:
				1771	return (struct spci_value){.func = SPCI_SUCCESS_32};
				1772	default:
				1773	return spci_error(SPCI_NOT_SUPPORTED);
				1774	}
				1775	}