blob: 90dac1949da19a7f458c6762891af15fd8665676 [file] [log] [blame]
/*
 * Copyright 2018 The Hafnium Authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     https://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
Andrew Scull18c78fc2018-08-20 12:57:41 +010017#include "hf/api.h"
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +010018
Andrew Walbran318f5732018-11-20 16:23:42 +000019#include "hf/arch/cpu.h"
Andrew Walbran508e63c2018-12-20 17:02:37 +000020#include "hf/arch/timer.h"
Andrew Walbran318f5732018-11-20 16:23:42 +000021
Andrew Scull877ae4b2019-07-02 12:52:33 +010022#include "hf/check.h"
Andrew Walbran318f5732018-11-20 16:23:42 +000023#include "hf/dlog.h"
Andrew Scull6386f252018-12-06 13:29:10 +000024#include "hf/mm.h"
Andrew Walbranb037d5b2019-06-25 17:19:41 +010025#include "hf/spci.h"
Andrew Scull6386f252018-12-06 13:29:10 +000026#include "hf/spinlock.h"
Andrew Scull877ae4b2019-07-02 12:52:33 +010027#include "hf/static_assert.h"
Andrew Scull8d9e1212019-04-05 13:52:55 +010028#include "hf/std.h"
Andrew Scull18c78fc2018-08-20 12:57:41 +010029#include "hf/vm.h"
30
Andrew Scullf35a5c92018-08-07 18:09:46 +010031#include "vmapi/hf/call.h"
Jose Marinhoa1dfeda2019-02-27 16:46:03 +000032#include "vmapi/hf/spci.h"
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +010033
/*
 * To eliminate the risk of deadlocks, we define a partial order for the
 * acquisition of locks held concurrently by the same physical CPU. Our current
 * ordering requirements are as follows:
 *
 * vm::lock -> vcpu::lock -> mm_stage1_lock
 *
 * Locks of the same kind require the lock of lowest address to be locked first,
 * see `sl_lock_both()`.
 */
44
Andrew Scullaa039b32018-10-04 15:02:26 +010045static_assert(HF_MAILBOX_SIZE == PAGE_SIZE,
Andrew Scull13652af2018-09-17 14:49:08 +010046 "Currently, a page is mapped for the send and receive buffers so "
47 "the maximum request is the size of a page.");
48
Wedson Almeida Filho9ed8da52018-12-17 16:09:11 +000049static struct mpool api_page_pool;
Wedson Almeida Filho22d5eaa2018-12-16 00:38:49 +000050
51/**
Wedson Almeida Filho81568c42019-01-04 13:33:02 +000052 * Initialises the API page pool by taking ownership of the contents of the
53 * given page pool.
Wedson Almeida Filho22d5eaa2018-12-16 00:38:49 +000054 */
55void api_init(struct mpool *ppool)
56{
Wedson Almeida Filho9ed8da52018-12-17 16:09:11 +000057 mpool_init_from(&api_page_pool, ppool);
Wedson Almeida Filho22d5eaa2018-12-16 00:38:49 +000058}
59
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +010060/**
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +010061 * Switches the physical CPU back to the corresponding vcpu of the primary VM.
Andrew Scullaa039b32018-10-04 15:02:26 +010062 *
63 * This triggers the scheduling logic to run. Run in the context of secondary VM
64 * to cause HF_VCPU_RUN to return and the primary VM to regain control of the
65 * cpu.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +010066 */
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +010067static struct vcpu *api_switch_to_primary(struct vcpu *current,
Wedson Almeida Filhoba641ef2018-12-03 04:19:44 +000068 struct hf_vcpu_run_return primary_ret,
69 enum vcpu_state secondary_state)
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +010070{
Andrew Walbran42347a92019-05-09 13:59:03 +010071 struct vm *primary = vm_find(HF_PRIMARY_VM_ID);
Andrew Walbrane1310df2019-04-29 17:28:28 +010072 struct vcpu *next = vm_get_vcpu(primary, cpu_index(current->cpu));
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +010073
Andrew Walbran508e63c2018-12-20 17:02:37 +000074 /*
75 * If the secondary is blocked but has a timer running, sleep until the
76 * timer fires rather than indefinitely.
77 */
Andrew Scullb06d1752019-02-04 10:15:48 +000078 switch (primary_ret.code) {
79 case HF_VCPU_RUN_WAIT_FOR_INTERRUPT:
80 case HF_VCPU_RUN_WAIT_FOR_MESSAGE:
81 primary_ret.sleep.ns =
82 arch_timer_enabled_current()
83 ? arch_timer_remaining_ns_current()
84 : HF_SLEEP_INDEFINITE;
85 break;
86
87 default:
88 /* Do nothing. */
89 break;
Andrew Walbran508e63c2018-12-20 17:02:37 +000090 }
91
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +010092 /* Set the return value for the primary VM's call to HF_VCPU_RUN. */
Andrew Scull6d2db332018-10-10 15:28:17 +010093 arch_regs_set_retval(&next->regs,
94 hf_vcpu_run_return_encode(primary_ret));
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +010095
Wedson Almeida Filhoba641ef2018-12-03 04:19:44 +000096 /* Mark the current vcpu as waiting. */
97 sl_lock(&current->lock);
98 current->state = secondary_state;
99 sl_unlock(&current->lock);
100
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100101 return next;
102}
103
104/**
Andrew Scull33fecd32019-01-08 14:48:27 +0000105 * Returns to the primary vm and signals that the vcpu still has work to do so.
106 */
107struct vcpu *api_preempt(struct vcpu *current)
108{
109 struct hf_vcpu_run_return ret = {
110 .code = HF_VCPU_RUN_PREEMPTED,
111 };
112
Andrew Sculld6ee1102019-04-05 22:12:42 +0100113 return api_switch_to_primary(current, ret, VCPU_STATE_READY);
Andrew Scull33fecd32019-01-08 14:48:27 +0000114}
115
116/**
Andrew Scullaa039b32018-10-04 15:02:26 +0100117 * Puts the current vcpu in wait for interrupt mode, and returns to the primary
118 * vm.
119 */
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +0100120struct vcpu *api_wait_for_interrupt(struct vcpu *current)
Andrew Scullaa039b32018-10-04 15:02:26 +0100121{
Andrew Scull6d2db332018-10-10 15:28:17 +0100122 struct hf_vcpu_run_return ret = {
123 .code = HF_VCPU_RUN_WAIT_FOR_INTERRUPT,
124 };
Wedson Almeida Filho81568c42019-01-04 13:33:02 +0000125
Wedson Almeida Filhoba641ef2018-12-03 04:19:44 +0000126 return api_switch_to_primary(current, ret,
Andrew Sculld6ee1102019-04-05 22:12:42 +0100127 VCPU_STATE_BLOCKED_INTERRUPT);
Andrew Scullaa039b32018-10-04 15:02:26 +0100128}
129
130/**
Andrew Walbran33645652019-04-15 12:29:31 +0100131 * Puts the current vCPU in off mode, and returns to the primary VM.
132 */
133struct vcpu *api_vcpu_off(struct vcpu *current)
134{
135 struct hf_vcpu_run_return ret = {
136 .code = HF_VCPU_RUN_WAIT_FOR_INTERRUPT,
137 };
138
139 /*
140 * Disable the timer, so the scheduler doesn't get told to call back
141 * based on it.
142 */
143 arch_timer_disable_current();
144
145 return api_switch_to_primary(current, ret, VCPU_STATE_OFF);
146}
147
148/**
Andrew Scull66d62bf2019-02-01 13:54:10 +0000149 * Returns to the primary vm to allow this cpu to be used for other tasks as the
150 * vcpu does not have work to do at this moment. The current vcpu is marked as
Jose Marinho135dff32019-02-28 10:25:57 +0000151 * ready to be scheduled again. This SPCI function always returns SPCI_SUCCESS.
Andrew Scull66d62bf2019-02-01 13:54:10 +0000152 */
Jose Marinho135dff32019-02-28 10:25:57 +0000153int32_t api_spci_yield(struct vcpu *current, struct vcpu **next)
Andrew Scull66d62bf2019-02-01 13:54:10 +0000154{
155 struct hf_vcpu_run_return ret = {
156 .code = HF_VCPU_RUN_YIELD,
157 };
158
159 if (current->vm->id == HF_PRIMARY_VM_ID) {
Andrew Scullb06d1752019-02-04 10:15:48 +0000160 /* Noop on the primary as it makes the scheduling decisions. */
Jose Marinho135dff32019-02-28 10:25:57 +0000161 return SPCI_SUCCESS;
Andrew Scull66d62bf2019-02-01 13:54:10 +0000162 }
163
Jose Marinho135dff32019-02-28 10:25:57 +0000164 *next = api_switch_to_primary(current, ret, VCPU_STATE_READY);
165
166 /* SPCI_YIELD always returns SPCI_SUCCESS. */
167 return SPCI_SUCCESS;
Andrew Scull66d62bf2019-02-01 13:54:10 +0000168}
169
170/**
Andrew Walbran33645652019-04-15 12:29:31 +0100171 * Switches to the primary so that it can switch to the target, or kick it if it
172 * is already running on a different physical CPU.
173 */
174struct vcpu *api_wake_up(struct vcpu *current, struct vcpu *target_vcpu)
175{
176 struct hf_vcpu_run_return ret = {
177 .code = HF_VCPU_RUN_WAKE_UP,
178 .wake_up.vm_id = target_vcpu->vm->id,
179 .wake_up.vcpu = vcpu_index(target_vcpu),
180 };
181 return api_switch_to_primary(current, ret, VCPU_STATE_READY);
182}
183
184/**
Andrew Scull38772ab2019-01-24 15:16:50 +0000185 * Aborts the vCPU and triggers its VM to abort fully.
Andrew Scull9726c252019-01-23 13:44:19 +0000186 */
187struct vcpu *api_abort(struct vcpu *current)
188{
189 struct hf_vcpu_run_return ret = {
190 .code = HF_VCPU_RUN_ABORTED,
191 };
192
193 dlog("Aborting VM %u vCPU %u\n", current->vm->id, vcpu_index(current));
194
195 if (current->vm->id == HF_PRIMARY_VM_ID) {
196 /* TODO: what to do when the primary aborts? */
197 for (;;) {
198 /* Do nothing. */
199 }
200 }
201
202 atomic_store_explicit(&current->vm->aborting, true,
203 memory_order_relaxed);
204
205 /* TODO: free resources once all vCPUs abort. */
206
Andrew Sculld6ee1102019-04-05 22:12:42 +0100207 return api_switch_to_primary(current, ret, VCPU_STATE_ABORTED);
Andrew Scull9726c252019-01-23 13:44:19 +0000208}
209
210/**
Andrew Scull55c4d8b2018-12-18 18:50:18 +0000211 * Returns the ID of the VM.
212 */
Andrew Walbranfc6cd9d2019-06-25 15:23:27 +0100213spci_vm_id_t api_vm_get_id(const struct vcpu *current)
Andrew Scull55c4d8b2018-12-18 18:50:18 +0000214{
215 return current->vm->id;
216}
217
218/**
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100219 * Returns the number of VMs configured to run.
220 */
Andrew Walbran52d99672019-06-25 15:51:11 +0100221spci_vm_count_t api_vm_get_count(void)
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100222{
Andrew Scull19503262018-09-20 14:48:39 +0100223 return vm_get_count();
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100224}
225
226/**
227 * Returns the number of vcpus configured in the given VM.
228 */
Andrew Walbran42347a92019-05-09 13:59:03 +0100229int64_t api_vcpu_get_count(spci_vm_id_t vm_id, const struct vcpu *current)
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100230{
Andrew Scull19503262018-09-20 14:48:39 +0100231 struct vm *vm;
232
233 /* Only the primary VM needs to know about vcpus for scheduling. */
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +0100234 if (current->vm->id != HF_PRIMARY_VM_ID) {
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100235 return -1;
Andrew Scull7364a8e2018-07-19 15:39:29 +0100236 }
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100237
Andrew Walbran42347a92019-05-09 13:59:03 +0100238 vm = vm_find(vm_id);
Andrew Scull19503262018-09-20 14:48:39 +0100239 if (vm == NULL) {
240 return -1;
241 }
242
243 return vm->vcpu_count;
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100244}
245
246/**
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000247 * This function is called by the architecture-specific context switching
248 * function to indicate that register state for the given vcpu has been saved
249 * and can therefore be used by other pcpus.
250 */
251void api_regs_state_saved(struct vcpu *vcpu)
252{
253 sl_lock(&vcpu->lock);
254 vcpu->regs_available = true;
255 sl_unlock(&vcpu->lock);
256}
257
258/**
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000259 * Retrieves the next waiter and removes it from the wait list if the VM's
260 * mailbox is in a writable state.
261 */
262static struct wait_entry *api_fetch_waiter(struct vm_locked locked_vm)
263{
264 struct wait_entry *entry;
265 struct vm *vm = locked_vm.vm;
266
Andrew Sculld6ee1102019-04-05 22:12:42 +0100267 if (vm->mailbox.state != MAILBOX_STATE_EMPTY ||
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000268 vm->mailbox.recv == NULL || list_empty(&vm->mailbox.waiter_list)) {
269 /* The mailbox is not writable or there are no waiters. */
270 return NULL;
271 }
272
273 /* Remove waiter from the wait list. */
274 entry = CONTAINER_OF(vm->mailbox.waiter_list.next, struct wait_entry,
275 wait_links);
276 list_remove(&entry->wait_links);
277 return entry;
278}
279
280/**
Andrew Walbran508e63c2018-12-20 17:02:37 +0000281 * Assuming that the arguments have already been checked by the caller, injects
282 * a virtual interrupt of the given ID into the given target vCPU. This doesn't
283 * cause the vCPU to actually be run immediately; it will be taken when the vCPU
284 * is next run, which is up to the scheduler.
285 *
286 * Returns:
287 * - 0 on success if no further action is needed.
288 * - 1 if it was called by the primary VM and the primary VM now needs to wake
289 * up or kick the target vCPU.
290 */
Andrew Walbranfc9d4382019-05-10 18:07:21 +0100291static int64_t internal_interrupt_inject(struct vcpu *target_vcpu,
Andrew Walbran508e63c2018-12-20 17:02:37 +0000292 uint32_t intid, struct vcpu *current,
293 struct vcpu **next)
294{
295 uint32_t intid_index = intid / INTERRUPT_REGISTER_BITS;
296 uint32_t intid_mask = 1u << (intid % INTERRUPT_REGISTER_BITS);
Andrew Walbran508e63c2018-12-20 17:02:37 +0000297 int64_t ret = 0;
298
299 sl_lock(&target_vcpu->lock);
Andrew Walbran508e63c2018-12-20 17:02:37 +0000300
301 /*
302 * We only need to change state and (maybe) trigger a virtual IRQ if it
303 * is enabled and was not previously pending. Otherwise we can skip
304 * everything except setting the pending bit.
305 *
306 * If you change this logic make sure to update the need_vm_lock logic
307 * above to match.
308 */
309 if (!(target_vcpu->interrupts.interrupt_enabled[intid_index] &
310 ~target_vcpu->interrupts.interrupt_pending[intid_index] &
311 intid_mask)) {
312 goto out;
313 }
314
315 /* Increment the count. */
316 target_vcpu->interrupts.enabled_and_pending_count++;
317
318 /*
319 * Only need to update state if there was not already an
320 * interrupt enabled and pending.
321 */
322 if (target_vcpu->interrupts.enabled_and_pending_count != 1) {
323 goto out;
324 }
325
Andrew Walbran508e63c2018-12-20 17:02:37 +0000326 if (current->vm->id == HF_PRIMARY_VM_ID) {
327 /*
328 * If the call came from the primary VM, let it know that it
329 * should run or kick the target vCPU.
330 */
331 ret = 1;
332 } else if (current != target_vcpu && next != NULL) {
Andrew Walbran33645652019-04-15 12:29:31 +0100333 *next = api_wake_up(current, target_vcpu);
Andrew Walbran508e63c2018-12-20 17:02:37 +0000334 }
335
336out:
337 /* Either way, make it pending. */
338 target_vcpu->interrupts.interrupt_pending[intid_index] |= intid_mask;
339
340 sl_unlock(&target_vcpu->lock);
Andrew Walbran508e63c2018-12-20 17:02:37 +0000341
342 return ret;
343}
344
345/**
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000346 * Prepares the vcpu to run by updating its state and fetching whether a return
347 * value needs to be forced onto the vCPU.
348 */
Andrew Scull38772ab2019-01-24 15:16:50 +0000349static bool api_vcpu_prepare_run(const struct vcpu *current, struct vcpu *vcpu,
Andrew Walbran508e63c2018-12-20 17:02:37 +0000350 struct hf_vcpu_run_return *run_ret)
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000351{
Andrew Scullb06d1752019-02-04 10:15:48 +0000352 bool need_vm_lock;
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000353 bool ret;
354
Andrew Scullb06d1752019-02-04 10:15:48 +0000355 /*
Andrew Scull4caadaf2019-07-03 13:13:47 +0100356 * Wait until the registers become available. All locks must be released
357 * between iterations of this loop to avoid potential deadlocks if, on
358 * any path, a lock needs to be taken after taking the decision to
359 * switch context but before the registers have been saved.
Andrew Scullb06d1752019-02-04 10:15:48 +0000360 *
Andrew Scull4caadaf2019-07-03 13:13:47 +0100361 * The VM lock is not needed in the common case so it must only be taken
362 * when it is going to be needed. This ensures there are no inter-vCPU
363 * dependencies in the common run case meaning the sensitive context
364 * switch performance is consistent.
Andrew Scullb06d1752019-02-04 10:15:48 +0000365 */
366 for (;;) {
367 sl_lock(&vcpu->lock);
368
369 /* The VM needs to be locked to deliver mailbox messages. */
Andrew Sculld6ee1102019-04-05 22:12:42 +0100370 need_vm_lock = vcpu->state == VCPU_STATE_BLOCKED_MAILBOX;
Andrew Scullb06d1752019-02-04 10:15:48 +0000371 if (need_vm_lock) {
372 sl_unlock(&vcpu->lock);
373 sl_lock(&vcpu->vm->lock);
374 sl_lock(&vcpu->lock);
375 }
376
377 if (vcpu->regs_available) {
378 break;
379 }
380
Andrew Sculld6ee1102019-04-05 22:12:42 +0100381 if (vcpu->state == VCPU_STATE_RUNNING) {
Andrew Scullb06d1752019-02-04 10:15:48 +0000382 /*
383 * vCPU is running on another pCPU.
384 *
Andrew Walbranabf88fb2019-06-21 12:17:47 +0100385 * It's ok not to return the sleep duration here because
Andrew Scullb06d1752019-02-04 10:15:48 +0000386 * the other physical CPU that is currently running this
Andrew Walbranabf88fb2019-06-21 12:17:47 +0100387 * vCPU will return the sleep duration if needed. The
388 * default return value is
389 * HF_VCPU_RUN_WAIT_FOR_INTERRUPT, so no need to set it
390 * explicitly.
Andrew Scullb06d1752019-02-04 10:15:48 +0000391 */
392 ret = false;
393 goto out;
394 }
395
396 sl_unlock(&vcpu->lock);
397 if (need_vm_lock) {
398 sl_unlock(&vcpu->vm->lock);
399 }
400 }
Andrew Scull9726c252019-01-23 13:44:19 +0000401
402 if (atomic_load_explicit(&vcpu->vm->aborting, memory_order_relaxed)) {
Andrew Sculld6ee1102019-04-05 22:12:42 +0100403 if (vcpu->state != VCPU_STATE_ABORTED) {
Andrew Scull82331282019-01-25 10:29:34 +0000404 dlog("Aborting VM %u vCPU %u\n", vcpu->vm->id,
405 vcpu_index(vcpu));
Andrew Sculld6ee1102019-04-05 22:12:42 +0100406 vcpu->state = VCPU_STATE_ABORTED;
Andrew Scull9726c252019-01-23 13:44:19 +0000407 }
408 ret = false;
409 goto out;
410 }
411
Andrew Walbran508e63c2018-12-20 17:02:37 +0000412 switch (vcpu->state) {
Andrew Sculld6ee1102019-04-05 22:12:42 +0100413 case VCPU_STATE_RUNNING:
414 case VCPU_STATE_OFF:
415 case VCPU_STATE_ABORTED:
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000416 ret = false;
417 goto out;
Andrew Scullb06d1752019-02-04 10:15:48 +0000418
Andrew Sculld6ee1102019-04-05 22:12:42 +0100419 case VCPU_STATE_BLOCKED_MAILBOX:
Andrew Scullb06d1752019-02-04 10:15:48 +0000420 /*
421 * A pending message allows the vCPU to run so the message can
422 * be delivered directly.
423 */
Andrew Sculld6ee1102019-04-05 22:12:42 +0100424 if (vcpu->vm->mailbox.state == MAILBOX_STATE_RECEIVED) {
Jose Marinho3e2442f2019-03-12 13:30:37 +0000425 arch_regs_set_retval(&vcpu->regs, SPCI_SUCCESS);
Andrew Sculld6ee1102019-04-05 22:12:42 +0100426 vcpu->vm->mailbox.state = MAILBOX_STATE_READ;
Andrew Scullb06d1752019-02-04 10:15:48 +0000427 break;
428 }
429 /* Fall through. */
Andrew Sculld6ee1102019-04-05 22:12:42 +0100430 case VCPU_STATE_BLOCKED_INTERRUPT:
Andrew Scullb06d1752019-02-04 10:15:48 +0000431 /* Allow virtual interrupts to be delivered. */
432 if (vcpu->interrupts.enabled_and_pending_count > 0) {
433 break;
434 }
435
436 /* The timer expired so allow the interrupt to be delivered. */
Andrew Walbran508e63c2018-12-20 17:02:37 +0000437 if (arch_timer_pending(&vcpu->regs)) {
438 break;
439 }
440
441 /*
442 * The vCPU is not ready to run, return the appropriate code to
443 * the primary which called vcpu_run.
444 */
445 if (arch_timer_enabled(&vcpu->regs)) {
Andrew Scullb06d1752019-02-04 10:15:48 +0000446 run_ret->code =
Andrew Sculld6ee1102019-04-05 22:12:42 +0100447 vcpu->state == VCPU_STATE_BLOCKED_MAILBOX
Andrew Scullb06d1752019-02-04 10:15:48 +0000448 ? HF_VCPU_RUN_WAIT_FOR_MESSAGE
449 : HF_VCPU_RUN_WAIT_FOR_INTERRUPT;
Andrew Walbran508e63c2018-12-20 17:02:37 +0000450 run_ret->sleep.ns =
451 arch_timer_remaining_ns(&vcpu->regs);
452 }
453
454 ret = false;
455 goto out;
Andrew Scullb06d1752019-02-04 10:15:48 +0000456
Andrew Sculld6ee1102019-04-05 22:12:42 +0100457 case VCPU_STATE_READY:
Andrew Walbran508e63c2018-12-20 17:02:37 +0000458 break;
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000459 }
460
Andrew Scullb06d1752019-02-04 10:15:48 +0000461 /* It has been decided that the vCPU should be run. */
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000462 vcpu->cpu = current->cpu;
Andrew Sculld6ee1102019-04-05 22:12:42 +0100463 vcpu->state = VCPU_STATE_RUNNING;
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000464
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000465 /*
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000466 * Mark the registers as unavailable now that we're about to reflect
467 * them onto the real registers. This will also prevent another physical
468 * CPU from trying to read these registers.
469 */
470 vcpu->regs_available = false;
471
472 ret = true;
473
474out:
475 sl_unlock(&vcpu->lock);
Andrew Scullb06d1752019-02-04 10:15:48 +0000476 if (need_vm_lock) {
477 sl_unlock(&vcpu->vm->lock);
478 }
479
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000480 return ret;
481}
482
483/**
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100484 * Runs the given vcpu of the given vm.
485 */
Andrew Walbranb037d5b2019-06-25 17:19:41 +0100486struct hf_vcpu_run_return api_vcpu_run(spci_vm_id_t vm_id,
487 spci_vcpu_index_t vcpu_idx,
Andrew Scull38772ab2019-01-24 15:16:50 +0000488 const struct vcpu *current,
489 struct vcpu **next)
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100490{
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100491 struct vm *vm;
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100492 struct vcpu *vcpu;
Andrew Scull6d2db332018-10-10 15:28:17 +0100493 struct hf_vcpu_run_return ret = {
494 .code = HF_VCPU_RUN_WAIT_FOR_INTERRUPT,
Andrew Scullb06d1752019-02-04 10:15:48 +0000495 .sleep.ns = HF_SLEEP_INDEFINITE,
Andrew Scull6d2db332018-10-10 15:28:17 +0100496 };
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100497
498 /* Only the primary VM can switch vcpus. */
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +0100499 if (current->vm->id != HF_PRIMARY_VM_ID) {
Andrew Scull6d2db332018-10-10 15:28:17 +0100500 goto out;
Andrew Scull7364a8e2018-07-19 15:39:29 +0100501 }
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100502
Andrew Scull19503262018-09-20 14:48:39 +0100503 /* Only secondary VM vcpus can be run. */
504 if (vm_id == HF_PRIMARY_VM_ID) {
Andrew Scull6d2db332018-10-10 15:28:17 +0100505 goto out;
Andrew Scull7364a8e2018-07-19 15:39:29 +0100506 }
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100507
Andrew Scull19503262018-09-20 14:48:39 +0100508 /* The requested VM must exist. */
Andrew Walbran42347a92019-05-09 13:59:03 +0100509 vm = vm_find(vm_id);
Andrew Scull19503262018-09-20 14:48:39 +0100510 if (vm == NULL) {
Andrew Scull6d2db332018-10-10 15:28:17 +0100511 goto out;
Andrew Scull19503262018-09-20 14:48:39 +0100512 }
513
514 /* The requested vcpu must exist. */
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100515 if (vcpu_idx >= vm->vcpu_count) {
Andrew Scull6d2db332018-10-10 15:28:17 +0100516 goto out;
Andrew Scull7364a8e2018-07-19 15:39:29 +0100517 }
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100518
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000519 /* Update state if allowed. */
Andrew Walbrane1310df2019-04-29 17:28:28 +0100520 vcpu = vm_get_vcpu(vm, vcpu_idx);
Andrew Scullb06d1752019-02-04 10:15:48 +0000521 if (!api_vcpu_prepare_run(current, vcpu, &ret)) {
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000522 goto out;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100523 }
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000524
Andrew Walbran508e63c2018-12-20 17:02:37 +0000525 /*
526 * Inject timer interrupt if timer has expired. It's safe to access
527 * vcpu->regs here because api_vcpu_prepare_run already made sure that
528 * regs_available was true (and then set it to false) before returning
529 * true.
530 */
531 if (arch_timer_pending(&vcpu->regs)) {
532 /* Make virtual timer interrupt pending. */
Andrew Walbranfc9d4382019-05-10 18:07:21 +0100533 internal_interrupt_inject(vcpu, HF_VIRTUAL_TIMER_INTID, vcpu,
534 NULL);
Andrew Walbran508e63c2018-12-20 17:02:37 +0000535
536 /*
537 * Set the mask bit so the hardware interrupt doesn't fire
538 * again. Ideally we wouldn't do this because it affects what
539 * the secondary vCPU sees, but if we don't then we end up with
540 * a loop of the interrupt firing each time we try to return to
541 * the secondary vCPU.
542 */
543 arch_timer_mask(&vcpu->regs);
544 }
545
Andrew Scull33fecd32019-01-08 14:48:27 +0000546 /* Switch to the vcpu. */
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000547 *next = vcpu;
Wedson Almeida Filho03306112018-11-26 00:08:03 +0000548
Andrew Scull33fecd32019-01-08 14:48:27 +0000549 /*
550 * Set a placeholder return code to the scheduler. This will be
551 * overwritten when the switch back to the primary occurs.
552 */
553 ret.code = HF_VCPU_RUN_PREEMPTED;
554
Andrew Scull6d2db332018-10-10 15:28:17 +0100555out:
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100556 return ret;
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +0100557}
558
559/**
Andrew Scull81e85092018-12-12 12:56:20 +0000560 * Check that the mode indicates memory that is valid, owned and exclusive.
561 */
Andrew Scullcbefbdb2019-01-11 16:36:26 +0000562static bool api_mode_valid_owned_and_exclusive(int mode)
Andrew Scull81e85092018-12-12 12:56:20 +0000563{
564 return (mode & (MM_MODE_INVALID | MM_MODE_UNOWNED | MM_MODE_SHARED)) ==
565 0;
566}
567
568/**
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000569 * Determines the value to be returned by api_vm_configure and api_mailbox_clear
570 * after they've succeeded. If a secondary VM is running and there are waiters,
571 * it also switches back to the primary VM for it to wake waiters up.
572 */
573static int64_t api_waiter_result(struct vm_locked locked_vm,
574 struct vcpu *current, struct vcpu **next)
575{
576 struct vm *vm = locked_vm.vm;
577 struct hf_vcpu_run_return ret = {
578 .code = HF_VCPU_RUN_NOTIFY_WAITERS,
579 };
580
581 if (list_empty(&vm->mailbox.waiter_list)) {
582 /* No waiters, nothing else to do. */
583 return 0;
584 }
585
586 if (vm->id == HF_PRIMARY_VM_ID) {
587 /* The caller is the primary VM. Tell it to wake up waiters. */
588 return 1;
589 }
590
591 /*
592 * Switch back to the primary VM, informing it that there are waiters
593 * that need to be notified.
594 */
Andrew Sculld6ee1102019-04-05 22:12:42 +0100595 *next = api_switch_to_primary(current, ret, VCPU_STATE_READY);
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000596
597 return 0;
598}
599
600/**
Andrew Sculle1322792019-07-01 17:46:10 +0100601 * Configures the hypervisor's stage-1 view of the send and receive pages. The
602 * stage-1 page tables must be locked so memory cannot be taken by another core
603 * which could result in this transaction being unable to roll back in the case
604 * of an error.
605 */
606static bool api_vm_configure_stage1(struct vm_locked vm_locked,
607 paddr_t pa_send_begin, paddr_t pa_send_end,
608 paddr_t pa_recv_begin, paddr_t pa_recv_end,
609 struct mpool *local_page_pool)
610{
611 bool ret;
612 struct mm_stage1_locked mm_stage1_locked = mm_lock_stage1();
613
614 /* Map the send page as read-only in the hypervisor address space. */
615 vm_locked.vm->mailbox.send =
616 mm_identity_map(mm_stage1_locked, pa_send_begin, pa_send_end,
617 MM_MODE_R, local_page_pool);
618 if (!vm_locked.vm->mailbox.send) {
619 /* TODO: partial defrag of failed range. */
620 /* Recover any memory consumed in failed mapping. */
621 mm_defrag(mm_stage1_locked, local_page_pool);
622 goto fail;
623 }
624
625 /*
626 * Map the receive page as writable in the hypervisor address space. On
627 * failure, unmap the send page before returning.
628 */
629 vm_locked.vm->mailbox.recv =
630 mm_identity_map(mm_stage1_locked, pa_recv_begin, pa_recv_end,
631 MM_MODE_W, local_page_pool);
632 if (!vm_locked.vm->mailbox.recv) {
633 /* TODO: partial defrag of failed range. */
634 /* Recover any memory consumed in failed mapping. */
635 mm_defrag(mm_stage1_locked, local_page_pool);
636 goto fail_undo_send;
637 }
638
639 ret = true;
640 goto out;
641
642 /*
643 * The following mappings will not require more memory than is available
644 * in the local pool.
645 */
646fail_undo_send:
647 vm_locked.vm->mailbox.send = NULL;
Andrew Scull7e8de322019-07-02 13:00:56 +0100648 CHECK(mm_unmap(mm_stage1_locked, pa_send_begin, pa_send_end,
649 local_page_pool));
Andrew Sculle1322792019-07-01 17:46:10 +0100650
651fail:
652 ret = false;
653
654out:
655 mm_unlock_stage1(&mm_stage1_locked);
656
657 return ret;
658}
659
660/**
661 * Configures the send and receive pages in the VM stage-2 and hypervisor
662 * stage-1 page tables. Locking of the page tables combined with a local memory
663 * pool ensures there will always be enough memory to recover from any errors
664 * that arise.
665 */
666static bool api_vm_configure_pages(struct vm_locked vm_locked,
667 paddr_t pa_send_begin, paddr_t pa_send_end,
668 int orig_send_mode, paddr_t pa_recv_begin,
669 paddr_t pa_recv_end, int orig_recv_mode)
670{
671 bool ret;
672 struct mpool local_page_pool;
673
674 /*
675 * Create a local pool so any freed memory can't be used by another
676 * thread. This is to ensure the original mapping can be restored if any
677 * stage of the process fails.
678 */
679 mpool_init_with_fallback(&local_page_pool, &api_page_pool);
680
681 /* Take memory ownership away from the VM and mark as shared. */
682 if (!mm_vm_identity_map(
683 &vm_locked.vm->ptable, pa_send_begin, pa_send_end,
684 MM_MODE_UNOWNED | MM_MODE_SHARED | MM_MODE_R | MM_MODE_W,
685 NULL, &local_page_pool)) {
686 goto fail;
687 }
688
689 if (!mm_vm_identity_map(&vm_locked.vm->ptable, pa_recv_begin,
690 pa_recv_end,
691 MM_MODE_UNOWNED | MM_MODE_SHARED | MM_MODE_R,
692 NULL, &local_page_pool)) {
693 /* TODO: partial defrag of failed range. */
694 /* Recover any memory consumed in failed mapping. */
695 mm_vm_defrag(&vm_locked.vm->ptable, &local_page_pool);
696 goto fail_undo_send;
697 }
698
699 if (!api_vm_configure_stage1(vm_locked, pa_send_begin, pa_send_end,
700 pa_recv_begin, pa_recv_end,
701 &local_page_pool)) {
702 goto fail_undo_send_and_recv;
703 }
704
705 ret = true;
706 goto out;
707
708 /*
709 * The following mappings will not require more memory than is available
710 * in the local pool.
711 */
712fail_undo_send_and_recv:
Andrew Scull7e8de322019-07-02 13:00:56 +0100713 CHECK(mm_vm_identity_map(&vm_locked.vm->ptable, pa_recv_begin,
714 pa_recv_end, orig_recv_mode, NULL,
715 &local_page_pool));
Andrew Sculle1322792019-07-01 17:46:10 +0100716
717fail_undo_send:
Andrew Scull7e8de322019-07-02 13:00:56 +0100718 CHECK(mm_vm_identity_map(&vm_locked.vm->ptable, pa_send_begin,
719 pa_send_end, orig_send_mode, NULL,
720 &local_page_pool));
Andrew Sculle1322792019-07-01 17:46:10 +0100721
722fail:
723 ret = false;
724
725out:
726 mpool_fini(&local_page_pool);
727
728 return ret;
729}
730
731/**
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100732 * Configures the VM to send/receive data through the specified pages. The pages
733 * must not be shared.
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000734 *
735 * Returns:
736 * - -1 on failure.
737 * - 0 on success if no further action is needed.
738 * - 1 if it was called by the primary VM and the primary VM now needs to wake
739 * up or kick waiters. Waiters should be retrieved by calling
740 * hf_mailbox_waiter_get.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100741 */
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000742int64_t api_vm_configure(ipaddr_t send, ipaddr_t recv, struct vcpu *current,
743 struct vcpu **next)
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100744{
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +0100745 struct vm *vm = current->vm;
Andrew Sculle1322792019-07-01 17:46:10 +0100746 struct vm_locked vm_locked;
Andrew Scull80871322018-08-06 12:04:09 +0100747 paddr_t pa_send_begin;
748 paddr_t pa_send_end;
749 paddr_t pa_recv_begin;
750 paddr_t pa_recv_end;
Andrew Scull220e6212018-12-21 18:09:00 +0000751 int orig_send_mode;
752 int orig_recv_mode;
Andrew Scullc0e569a2018-10-02 18:05:21 +0100753 int64_t ret;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100754
755 /* Fail if addresses are not page-aligned. */
Alfredo Mazzinghieb1997c2019-02-07 18:00:01 +0000756 if (!is_aligned(ipa_addr(send), PAGE_SIZE) ||
757 !is_aligned(ipa_addr(recv), PAGE_SIZE)) {
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100758 return -1;
759 }
760
Andrew Scullc2eb6a32018-12-13 16:54:24 +0000761 /* Convert to physical addresses. */
762 pa_send_begin = pa_from_ipa(send);
763 pa_send_end = pa_add(pa_send_begin, PAGE_SIZE);
764
765 pa_recv_begin = pa_from_ipa(recv);
766 pa_recv_end = pa_add(pa_recv_begin, PAGE_SIZE);
767
Andrew Scullc9ccb3f2018-08-13 15:27:12 +0100768 /* Fail if the same page is used for the send and receive pages. */
769 if (pa_addr(pa_send_begin) == pa_addr(pa_recv_begin)) {
Andrew Scull220e6212018-12-21 18:09:00 +0000770 return -1;
771 }
772
Andrew Scull3c0a90a2019-07-01 11:55:53 +0100773 /*
774 * The hypervisor's memory map must be locked for the duration of this
775 * operation to ensure there will be sufficient memory to recover from
776 * any failures.
777 *
778 * TODO: the scope of the can be reduced but will require restructuring
779 * to keep a single unlock point.
780 */
Andrew Sculle1322792019-07-01 17:46:10 +0100781 vm_locked = vm_lock(vm);
Andrew Scull220e6212018-12-21 18:09:00 +0000782
783 /* We only allow these to be setup once. */
784 if (vm->mailbox.send || vm->mailbox.recv) {
785 goto fail;
786 }
787
788 /*
789 * Ensure the pages are valid, owned and exclusive to the VM and that
790 * the VM has the required access to the memory.
791 */
792 if (!mm_vm_get_mode(&vm->ptable, send, ipa_add(send, PAGE_SIZE),
793 &orig_send_mode) ||
794 !api_mode_valid_owned_and_exclusive(orig_send_mode) ||
795 (orig_send_mode & MM_MODE_R) == 0 ||
796 (orig_send_mode & MM_MODE_W) == 0) {
797 goto fail;
798 }
799
800 if (!mm_vm_get_mode(&vm->ptable, recv, ipa_add(recv, PAGE_SIZE),
801 &orig_recv_mode) ||
802 !api_mode_valid_owned_and_exclusive(orig_recv_mode) ||
803 (orig_recv_mode & MM_MODE_R) == 0) {
804 goto fail;
805 }
806
Andrew Sculle1322792019-07-01 17:46:10 +0100807 if (!api_vm_configure_pages(vm_locked, pa_send_begin, pa_send_end,
808 orig_send_mode, pa_recv_begin, pa_recv_end,
809 orig_recv_mode)) {
810 goto fail;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100811 }
812
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000813 /* Tell caller about waiters, if any. */
Andrew Sculle1322792019-07-01 17:46:10 +0100814 ret = api_waiter_result(vm_locked, current, next);
Andrew Scull220e6212018-12-21 18:09:00 +0000815 goto exit;
816
Andrew Scull220e6212018-12-21 18:09:00 +0000817fail:
818 ret = -1;
819
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100820exit:
Andrew Sculle1322792019-07-01 17:46:10 +0100821 vm_unlock(&vm_locked);
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100822
823 return ret;
824}
825
826/**
Andrew Scullaa039b32018-10-04 15:02:26 +0100827 * Copies data from the sender's send buffer to the recipient's receive buffer
828 * and notifies the recipient.
Wedson Almeida Filho17c997f2019-01-09 18:50:09 +0000829 *
830 * If the recipient's receive buffer is busy, it can optionally register the
831 * caller to be notified when the recipient's receive buffer becomes available.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100832 */
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000833int32_t api_spci_msg_send(uint32_t attributes, struct vcpu *current,
834 struct vcpu **next)
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100835{
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +0100836 struct vm *from = current->vm;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100837 struct vm *to;
Andrew Scullb06d1752019-02-04 10:15:48 +0000838 struct hf_vcpu_run_return primary_ret = {
839 .code = HF_VCPU_RUN_MESSAGE,
840 };
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000841 struct spci_message from_msg_replica;
842 struct spci_message *to_msg;
843 const struct spci_message *from_msg;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100844
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000845 uint32_t size;
Andrew Scull19503262018-09-20 14:48:39 +0100846
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000847 int64_t ret;
848 bool notify = (attributes & SPCI_MSG_SEND_NOTIFY_MASK) ==
849 SPCI_MSG_SEND_NOTIFY;
Andrew Scull19503262018-09-20 14:48:39 +0100850
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000851 /*
852 * Check that the sender has configured its send buffer. Copy the
853 * message header. If the tx mailbox at from_msg is configured (i.e.
854 * from_msg != NULL) then it can be safely accessed after releasing the
855 * lock since the tx mailbox address can only be configured once.
856 */
857 sl_lock(&from->lock);
858 from_msg = from->mailbox.send;
859 sl_unlock(&from->lock);
860
861 if (from_msg == NULL) {
862 return SPCI_INVALID_PARAMETERS;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100863 }
864
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100865 /*
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000866 * Note that the payload is not copied when the message header is.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100867 */
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000868 from_msg_replica = *from_msg;
869
870 /* Ensure source VM id corresponds to the current VM. */
871 if (from_msg_replica.source_vm_id != from->id) {
872 return SPCI_INVALID_PARAMETERS;
873 }
874
875 size = from_msg_replica.length;
876 /* Limit the size of transfer. */
Andrew Scull1262ac22019-04-05 12:44:26 +0100877 if (size > SPCI_MSG_PAYLOAD_MAX) {
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000878 return SPCI_INVALID_PARAMETERS;
879 }
880
881 /* Disallow reflexive requests as this suggests an error in the VM. */
882 if (from_msg_replica.target_vm_id == from->id) {
883 return SPCI_INVALID_PARAMETERS;
884 }
885
886 /* Ensure the target VM exists. */
Andrew Walbran42347a92019-05-09 13:59:03 +0100887 to = vm_find(from_msg_replica.target_vm_id);
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000888 if (to == NULL) {
889 return SPCI_INVALID_PARAMETERS;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100890 }
891
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100892 sl_lock(&to->lock);
893
Andrew Sculld6ee1102019-04-05 22:12:42 +0100894 if (to->mailbox.state != MAILBOX_STATE_EMPTY ||
Andrew Scullaa039b32018-10-04 15:02:26 +0100895 to->mailbox.recv == NULL) {
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000896 /*
897 * Fail if the target isn't currently ready to receive data,
898 * setting up for notification if requested.
899 */
900 if (notify) {
Wedson Almeida Filhob790f652019-01-22 23:41:56 +0000901 struct wait_entry *entry =
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000902 &current->vm->wait_entries
903 [from_msg_replica.target_vm_id];
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +0000904
905 /* Append waiter only if it's not there yet. */
906 if (list_empty(&entry->wait_links)) {
907 list_append(&to->mailbox.waiter_list,
908 &entry->wait_links);
909 }
910 }
911
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000912 ret = SPCI_BUSY;
Andrew Scullaa039b32018-10-04 15:02:26 +0100913 goto out;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100914 }
915
Andrew Scullaa039b32018-10-04 15:02:26 +0100916 /* Copy data. */
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000917 to_msg = to->mailbox.recv;
918 *to_msg = from_msg_replica;
Andrew Sculla1aa2ba2019-04-05 11:49:02 +0100919 memcpy_s(to_msg->payload, SPCI_MSG_PAYLOAD_MAX,
920 from->mailbox.send->payload, size);
Andrew Scullb06d1752019-02-04 10:15:48 +0000921 primary_ret.message.vm_id = to->id;
Jose Marinhoa1dfeda2019-02-27 16:46:03 +0000922 ret = SPCI_SUCCESS;
Andrew Scullaa039b32018-10-04 15:02:26 +0100923
924 /* Messages for the primary VM are delivered directly. */
925 if (to->id == HF_PRIMARY_VM_ID) {
Andrew Sculld6ee1102019-04-05 22:12:42 +0100926 to->mailbox.state = MAILBOX_STATE_READ;
Wedson Almeida Filhoba641ef2018-12-03 04:19:44 +0000927 *next = api_switch_to_primary(current, primary_ret,
Andrew Sculld6ee1102019-04-05 22:12:42 +0100928 VCPU_STATE_READY);
Andrew Scullaa039b32018-10-04 15:02:26 +0100929 goto out;
930 }
931
Andrew Sculld6ee1102019-04-05 22:12:42 +0100932 to->mailbox.state = MAILBOX_STATE_RECEIVED;
Andrew Scullaa039b32018-10-04 15:02:26 +0100933
934 /* Return to the primary VM directly or with a switch. */
Andrew Scullb06d1752019-02-04 10:15:48 +0000935 if (from->id != HF_PRIMARY_VM_ID) {
Wedson Almeida Filhoba641ef2018-12-03 04:19:44 +0000936 *next = api_switch_to_primary(current, primary_ret,
Andrew Sculld6ee1102019-04-05 22:12:42 +0100937 VCPU_STATE_READY);
Wedson Almeida Filho80eb4a32018-11-30 17:11:15 +0000938 }
Andrew Scullaa039b32018-10-04 15:02:26 +0100939
940out:
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100941 sl_unlock(&to->lock);
942
Wedson Almeida Filho80eb4a32018-11-30 17:11:15 +0000943 return ret;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100944}
945
946/**
Andrew Scullaa039b32018-10-04 15:02:26 +0100947 * Receives a message from the mailbox. If one isn't available, this function
948 * can optionally block the caller until one becomes available.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100949 *
Andrew Scullaa039b32018-10-04 15:02:26 +0100950 * No new messages can be received until the mailbox has been cleared.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100951 */
Jose Marinho3e2442f2019-03-12 13:30:37 +0000952int32_t api_spci_msg_recv(uint32_t attributes, struct vcpu *current,
953 struct vcpu **next)
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100954{
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +0100955 struct vm *vm = current->vm;
Jose Marinho3e2442f2019-03-12 13:30:37 +0000956 int32_t return_code;
957 bool block =
958 (attributes & SPCI_MSG_RECV_BLOCK_MASK) == SPCI_MSG_RECV_BLOCK;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100959
Andrew Scullaa039b32018-10-04 15:02:26 +0100960 /*
961 * The primary VM will receive messages as a status code from running
962 * vcpus and must not call this function.
963 */
Andrew Scull19503262018-09-20 14:48:39 +0100964 if (vm->id == HF_PRIMARY_VM_ID) {
Jose Marinho3e2442f2019-03-12 13:30:37 +0000965 return SPCI_INTERRUPTED;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100966 }
967
968 sl_lock(&vm->lock);
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100969
Andrew Scullaa039b32018-10-04 15:02:26 +0100970 /* Return pending messages without blocking. */
Andrew Sculld6ee1102019-04-05 22:12:42 +0100971 if (vm->mailbox.state == MAILBOX_STATE_RECEIVED) {
972 vm->mailbox.state = MAILBOX_STATE_READ;
Jose Marinho3e2442f2019-03-12 13:30:37 +0000973 return_code = SPCI_SUCCESS;
974 goto out;
975 }
976
977 /* No pending message so fail if not allowed to block. */
978 if (!block) {
979 return_code = SPCI_RETRY;
Andrew Scullaa039b32018-10-04 15:02:26 +0100980 goto out;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +0100981 }
Andrew Scullaa039b32018-10-04 15:02:26 +0100982
Andrew Walbran9311c9a2019-03-12 16:59:04 +0000983 /*
Jose Marinho3e2442f2019-03-12 13:30:37 +0000984 * From this point onward this call can only be interrupted or a message
985 * received. If a message is received the return value will be set at
986 * that time to SPCI_SUCCESS.
Andrew Walbran9311c9a2019-03-12 16:59:04 +0000987 */
Jose Marinho3e2442f2019-03-12 13:30:37 +0000988 return_code = SPCI_INTERRUPTED;
989
990 /*
991 * Don't block if there are enabled and pending interrupts, to match
992 * behaviour of wait_for_interrupt.
993 */
994 if (current->interrupts.enabled_and_pending_count > 0) {
Andrew Scullaa039b32018-10-04 15:02:26 +0100995 goto out;
996 }
997
Andrew Scullaa039b32018-10-04 15:02:26 +0100998 /* Switch back to primary vm to block. */
Andrew Walbranb4816552018-12-05 17:35:42 +0000999 {
1000 struct hf_vcpu_run_return run_return = {
Andrew Scullb06d1752019-02-04 10:15:48 +00001001 .code = HF_VCPU_RUN_WAIT_FOR_MESSAGE,
Andrew Walbranb4816552018-12-05 17:35:42 +00001002 };
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001003
Andrew Walbranb4816552018-12-05 17:35:42 +00001004 *next = api_switch_to_primary(current, run_return,
Andrew Sculld6ee1102019-04-05 22:12:42 +01001005 VCPU_STATE_BLOCKED_MAILBOX);
Andrew Walbranb4816552018-12-05 17:35:42 +00001006 }
Andrew Scullaa039b32018-10-04 15:02:26 +01001007out:
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001008 sl_unlock(&vm->lock);
1009
Jose Marinho3e2442f2019-03-12 13:30:37 +00001010 return return_code;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001011}
1012
1013/**
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001014 * Retrieves the next VM whose mailbox became writable. For a VM to be notified
1015 * by this function, the caller must have called api_mailbox_send before with
1016 * the notify argument set to true, and this call must have failed because the
1017 * mailbox was not available.
1018 *
1019 * It should be called repeatedly to retrieve a list of VMs.
1020 *
1021 * Returns -1 if no VM became writable, or the id of the VM whose mailbox
1022 * became writable.
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001023 */
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001024int64_t api_mailbox_writable_get(const struct vcpu *current)
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001025{
Wedson Almeida Filho00df6c72018-10-18 11:19:24 +01001026 struct vm *vm = current->vm;
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001027 struct wait_entry *entry;
Andrew Scullc0e569a2018-10-02 18:05:21 +01001028 int64_t ret;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001029
1030 sl_lock(&vm->lock);
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001031 if (list_empty(&vm->mailbox.ready_list)) {
1032 ret = -1;
1033 goto exit;
1034 }
1035
1036 entry = CONTAINER_OF(vm->mailbox.ready_list.next, struct wait_entry,
1037 ready_links);
1038 list_remove(&entry->ready_links);
Wedson Almeida Filhob790f652019-01-22 23:41:56 +00001039 ret = entry - vm->wait_entries;
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001040
1041exit:
1042 sl_unlock(&vm->lock);
1043 return ret;
1044}
1045
1046/**
1047 * Retrieves the next VM waiting to be notified that the mailbox of the
1048 * specified VM became writable. Only primary VMs are allowed to call this.
1049 *
Wedson Almeida Filhob790f652019-01-22 23:41:56 +00001050 * Returns -1 on failure or if there are no waiters; the VM id of the next
1051 * waiter otherwise.
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001052 */
Andrew Walbran42347a92019-05-09 13:59:03 +01001053int64_t api_mailbox_waiter_get(spci_vm_id_t vm_id, const struct vcpu *current)
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001054{
1055 struct vm *vm;
1056 struct vm_locked locked;
1057 struct wait_entry *entry;
1058 struct vm *waiting_vm;
1059
1060 /* Only primary VMs are allowed to call this function. */
1061 if (current->vm->id != HF_PRIMARY_VM_ID) {
1062 return -1;
1063 }
1064
Andrew Walbran42347a92019-05-09 13:59:03 +01001065 vm = vm_find(vm_id);
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001066 if (vm == NULL) {
1067 return -1;
1068 }
1069
1070 /* Check if there are outstanding notifications from given vm. */
Andrew Walbran7e932bd2019-04-29 16:47:06 +01001071 locked = vm_lock(vm);
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001072 entry = api_fetch_waiter(locked);
1073 vm_unlock(&locked);
1074
1075 if (entry == NULL) {
1076 return -1;
1077 }
1078
1079 /* Enqueue notification to waiting VM. */
1080 waiting_vm = entry->waiting_vm;
1081
1082 sl_lock(&waiting_vm->lock);
1083 if (list_empty(&entry->ready_links)) {
1084 list_append(&waiting_vm->mailbox.ready_list,
1085 &entry->ready_links);
1086 }
1087 sl_unlock(&waiting_vm->lock);
1088
1089 return waiting_vm->id;
1090}
1091
1092/**
1093 * Clears the caller's mailbox so that a new message can be received. The caller
1094 * must have copied out all data they wish to preserve as new messages will
1095 * overwrite the old and will arrive asynchronously.
1096 *
1097 * Returns:
Andrew Scullaa7db8e2019-02-01 14:12:19 +00001098 * - -1 on failure, if the mailbox hasn't been read.
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001099 * - 0 on success if no further action is needed.
1100 * - 1 if it was called by the primary VM and the primary VM now needs to wake
1101 * up or kick waiters. Waiters should be retrieved by calling
1102 * hf_mailbox_waiter_get.
1103 */
1104int64_t api_mailbox_clear(struct vcpu *current, struct vcpu **next)
1105{
1106 struct vm *vm = current->vm;
1107 struct vm_locked locked;
1108 int64_t ret;
1109
Andrew Walbran7e932bd2019-04-29 16:47:06 +01001110 locked = vm_lock(vm);
Andrew Scullaa7db8e2019-02-01 14:12:19 +00001111 switch (vm->mailbox.state) {
Andrew Sculld6ee1102019-04-05 22:12:42 +01001112 case MAILBOX_STATE_EMPTY:
Andrew Scullaa7db8e2019-02-01 14:12:19 +00001113 ret = 0;
1114 break;
1115
Andrew Sculld6ee1102019-04-05 22:12:42 +01001116 case MAILBOX_STATE_RECEIVED:
Andrew Scullaa7db8e2019-02-01 14:12:19 +00001117 ret = -1;
1118 break;
1119
Andrew Sculld6ee1102019-04-05 22:12:42 +01001120 case MAILBOX_STATE_READ:
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001121 ret = api_waiter_result(locked, current, next);
Andrew Sculld6ee1102019-04-05 22:12:42 +01001122 vm->mailbox.state = MAILBOX_STATE_EMPTY;
Andrew Scullaa7db8e2019-02-01 14:12:19 +00001123 break;
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001124 }
Wedson Almeida Filhoea62e2e2019-01-09 19:14:59 +00001125 vm_unlock(&locked);
Wedson Almeida Filho2f94ec12018-07-26 16:00:48 +01001126
1127 return ret;
Wedson Almeida Filho3fcbcff2018-07-10 23:53:39 +01001128}
Andrew Walbran318f5732018-11-20 16:23:42 +00001129
1130/**
1131 * Enables or disables a given interrupt ID for the calling vCPU.
1132 *
1133 * Returns 0 on success, or -1 if the intid is invalid.
1134 */
Wedson Almeida Filhoc559d132019-01-09 19:33:40 +00001135int64_t api_interrupt_enable(uint32_t intid, bool enable, struct vcpu *current)
Andrew Walbran318f5732018-11-20 16:23:42 +00001136{
1137 uint32_t intid_index = intid / INTERRUPT_REGISTER_BITS;
1138 uint32_t intid_mask = 1u << (intid % INTERRUPT_REGISTER_BITS);
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001139
Andrew Walbran318f5732018-11-20 16:23:42 +00001140 if (intid >= HF_NUM_INTIDS) {
1141 return -1;
1142 }
1143
1144 sl_lock(&current->lock);
1145 if (enable) {
Andrew Walbran3d84a262018-12-13 14:41:19 +00001146 /*
1147 * If it is pending and was not enabled before, increment the
1148 * count.
1149 */
1150 if (current->interrupts.interrupt_pending[intid_index] &
1151 ~current->interrupts.interrupt_enabled[intid_index] &
1152 intid_mask) {
1153 current->interrupts.enabled_and_pending_count++;
1154 }
Andrew Walbran318f5732018-11-20 16:23:42 +00001155 current->interrupts.interrupt_enabled[intid_index] |=
1156 intid_mask;
Andrew Walbran318f5732018-11-20 16:23:42 +00001157 } else {
Andrew Walbran3d84a262018-12-13 14:41:19 +00001158 /*
1159 * If it is pending and was enabled before, decrement the count.
1160 */
1161 if (current->interrupts.interrupt_pending[intid_index] &
1162 current->interrupts.interrupt_enabled[intid_index] &
1163 intid_mask) {
1164 current->interrupts.enabled_and_pending_count--;
1165 }
Andrew Walbran318f5732018-11-20 16:23:42 +00001166 current->interrupts.interrupt_enabled[intid_index] &=
1167 ~intid_mask;
1168 }
1169
1170 sl_unlock(&current->lock);
1171 return 0;
1172}
1173
1174/**
1175 * Returns the ID of the next pending interrupt for the calling vCPU, and
1176 * acknowledges it (i.e. marks it as no longer pending). Returns
1177 * HF_INVALID_INTID if there are no pending interrupts.
1178 */
Wedson Almeida Filhoc559d132019-01-09 19:33:40 +00001179uint32_t api_interrupt_get(struct vcpu *current)
Andrew Walbran318f5732018-11-20 16:23:42 +00001180{
1181 uint8_t i;
1182 uint32_t first_interrupt = HF_INVALID_INTID;
Andrew Walbran318f5732018-11-20 16:23:42 +00001183
1184 /*
1185 * Find the first enabled and pending interrupt ID, return it, and
1186 * deactivate it.
1187 */
1188 sl_lock(&current->lock);
1189 for (i = 0; i < HF_NUM_INTIDS / INTERRUPT_REGISTER_BITS; ++i) {
1190 uint32_t enabled_and_pending =
1191 current->interrupts.interrupt_enabled[i] &
1192 current->interrupts.interrupt_pending[i];
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001193
Andrew Walbran318f5732018-11-20 16:23:42 +00001194 if (enabled_and_pending != 0) {
Andrew Walbran3d84a262018-12-13 14:41:19 +00001195 uint8_t bit_index = ctz(enabled_and_pending);
1196 /*
1197 * Mark it as no longer pending and decrement the count.
1198 */
1199 current->interrupts.interrupt_pending[i] &=
1200 ~(1u << bit_index);
1201 current->interrupts.enabled_and_pending_count--;
1202 first_interrupt =
1203 i * INTERRUPT_REGISTER_BITS + bit_index;
Andrew Walbran318f5732018-11-20 16:23:42 +00001204 break;
1205 }
1206 }
Andrew Walbran318f5732018-11-20 16:23:42 +00001207
1208 sl_unlock(&current->lock);
1209 return first_interrupt;
1210}
1211
1212/**
Andrew Walbran4cf217a2018-12-14 15:24:50 +00001213 * Returns whether the current vCPU is allowed to inject an interrupt into the
Andrew Walbran318f5732018-11-20 16:23:42 +00001214 * given VM and vCPU.
1215 */
1216static inline bool is_injection_allowed(uint32_t target_vm_id,
1217 struct vcpu *current)
1218{
1219 uint32_t current_vm_id = current->vm->id;
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001220
Andrew Walbran318f5732018-11-20 16:23:42 +00001221 /*
1222 * The primary VM is allowed to inject interrupts into any VM. Secondary
1223 * VMs are only allowed to inject interrupts into their own vCPUs.
1224 */
1225 return current_vm_id == HF_PRIMARY_VM_ID ||
1226 current_vm_id == target_vm_id;
1227}
1228
1229/**
1230 * Injects a virtual interrupt of the given ID into the given target vCPU.
1231 * This doesn't cause the vCPU to actually be run immediately; it will be taken
1232 * when the vCPU is next run, which is up to the scheduler.
1233 *
Andrew Walbran3d84a262018-12-13 14:41:19 +00001234 * Returns:
1235 * - -1 on failure because the target VM or vCPU doesn't exist, the interrupt
1236 * ID is invalid, or the current VM is not allowed to inject interrupts to
1237 * the target VM.
1238 * - 0 on success if no further action is needed.
1239 * - 1 if it was called by the primary VM and the primary VM now needs to wake
1240 * up or kick the target vCPU.
Andrew Walbran318f5732018-11-20 16:23:42 +00001241 */
Andrew Walbran42347a92019-05-09 13:59:03 +01001242int64_t api_interrupt_inject(spci_vm_id_t target_vm_id,
Andrew Walbranb037d5b2019-06-25 17:19:41 +01001243 spci_vcpu_index_t target_vcpu_idx, uint32_t intid,
Andrew Walbran42347a92019-05-09 13:59:03 +01001244 struct vcpu *current, struct vcpu **next)
Andrew Walbran318f5732018-11-20 16:23:42 +00001245{
Andrew Walbran318f5732018-11-20 16:23:42 +00001246 struct vcpu *target_vcpu;
Andrew Walbran42347a92019-05-09 13:59:03 +01001247 struct vm *target_vm = vm_find(target_vm_id);
Andrew Walbran318f5732018-11-20 16:23:42 +00001248
1249 if (intid >= HF_NUM_INTIDS) {
1250 return -1;
1251 }
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001252
Andrew Walbran318f5732018-11-20 16:23:42 +00001253 if (target_vm == NULL) {
1254 return -1;
1255 }
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001256
Andrew Walbran318f5732018-11-20 16:23:42 +00001257 if (target_vcpu_idx >= target_vm->vcpu_count) {
1258 /* The requested vcpu must exist. */
1259 return -1;
1260 }
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001261
Andrew Walbran318f5732018-11-20 16:23:42 +00001262 if (!is_injection_allowed(target_vm_id, current)) {
1263 return -1;
1264 }
Wedson Almeida Filho81568c42019-01-04 13:33:02 +00001265
Andrew Walbrane1310df2019-04-29 17:28:28 +01001266 target_vcpu = vm_get_vcpu(target_vm, target_vcpu_idx);
Andrew Walbran318f5732018-11-20 16:23:42 +00001267
1268 dlog("Injecting IRQ %d for VM %d VCPU %d from VM %d VCPU %d\n", intid,
1269 target_vm_id, target_vcpu_idx, current->vm->id, current->cpu->id);
Andrew Walbranfc9d4382019-05-10 18:07:21 +01001270 return internal_interrupt_inject(target_vcpu, intid, current, next);
Andrew Walbran318f5732018-11-20 16:23:42 +00001271}
Andrew Scull6386f252018-12-06 13:29:10 +00001272
1273/**
1274 * Clears a region of physical memory by overwriting it with zeros. The data is
1275 * flushed from the cache so the memory has been cleared across the system.
1276 */
1277static bool api_clear_memory(paddr_t begin, paddr_t end, struct mpool *ppool)
1278{
1279 /*
1280 * TODO: change this to a cpu local single page window rather than a
1281 * global mapping of the whole range. Such an approach will limit
1282 * the changes to stage-1 tables and will allow only local
1283 * invalidation.
1284 */
Andrew Scull3c0a90a2019-07-01 11:55:53 +01001285 bool ret;
1286 struct mm_stage1_locked stage1_locked = mm_lock_stage1();
1287 void *ptr =
1288 mm_identity_map(stage1_locked, begin, end, MM_MODE_W, ppool);
Andrew Walbran2cb43392019-04-17 12:52:45 +01001289 size_t size = pa_difference(begin, end);
Andrew Scull6386f252018-12-06 13:29:10 +00001290
1291 if (!ptr) {
1292 /* TODO: partial defrag of failed range. */
1293 /* Recover any memory consumed in failed mapping. */
Andrew Scull3c0a90a2019-07-01 11:55:53 +01001294 mm_defrag(stage1_locked, ppool);
1295 goto fail;
Andrew Scull6386f252018-12-06 13:29:10 +00001296 }
1297
Andrew Scull2b5fbad2019-04-05 13:55:56 +01001298 memset_s(ptr, size, 0, size);
Andrew Scull6386f252018-12-06 13:29:10 +00001299 arch_mm_write_back_dcache(ptr, size);
Andrew Scull3c0a90a2019-07-01 11:55:53 +01001300 mm_unmap(stage1_locked, begin, end, ppool);
Andrew Scull6386f252018-12-06 13:29:10 +00001301
Andrew Scull3c0a90a2019-07-01 11:55:53 +01001302 ret = true;
1303 goto out;
1304
1305fail:
1306 ret = false;
1307
1308out:
1309 mm_unlock_stage1(&stage1_locked);
1310
1311 return ret;
Andrew Scull6386f252018-12-06 13:29:10 +00001312}
1313
1314/**
1315 * Shares memory from the calling VM with another. The memory can be shared in
1316 * different modes.
1317 *
1318 * TODO: the interface for sharing memory will need to be enhanced to allow
1319 * sharing with different modes e.g. read-only, informing the recipient
1320 * of the memory they have been given, opting to not wipe the memory and
1321 * possibly allowing multiple blocks to be transferred. What this will
1322 * look like is TBD.
1323 */
Andrew Walbran42347a92019-05-09 13:59:03 +01001324int64_t api_share_memory(spci_vm_id_t vm_id, ipaddr_t addr, size_t size,
Andrew Scull6386f252018-12-06 13:29:10 +00001325 enum hf_share share, struct vcpu *current)
1326{
1327 struct vm *from = current->vm;
1328 struct vm *to;
1329 int orig_from_mode;
1330 int from_mode;
1331 int to_mode;
1332 ipaddr_t begin;
1333 ipaddr_t end;
1334 paddr_t pa_begin;
1335 paddr_t pa_end;
1336 struct mpool local_page_pool;
1337 int64_t ret;
1338
1339 /* Disallow reflexive shares as this suggests an error in the VM. */
1340 if (vm_id == from->id) {
1341 return -1;
1342 }
1343
1344 /* Ensure the target VM exists. */
Andrew Walbran42347a92019-05-09 13:59:03 +01001345 to = vm_find(vm_id);
Andrew Scull6386f252018-12-06 13:29:10 +00001346 if (to == NULL) {
1347 return -1;
1348 }
1349
1350 begin = addr;
1351 end = ipa_add(addr, size);
1352
1353 /* Fail if addresses are not page-aligned. */
Alfredo Mazzinghieb1997c2019-02-07 18:00:01 +00001354 if (!is_aligned(ipa_addr(begin), PAGE_SIZE) ||
1355 !is_aligned(ipa_addr(end), PAGE_SIZE)) {
Andrew Scull6386f252018-12-06 13:29:10 +00001356 return -1;
1357 }
1358
1359 /* Convert the sharing request to memory management modes. */
1360 switch (share) {
1361 case HF_MEMORY_GIVE:
1362 from_mode = MM_MODE_INVALID | MM_MODE_UNOWNED;
1363 to_mode = MM_MODE_R | MM_MODE_W | MM_MODE_X;
1364 break;
1365
1366 case HF_MEMORY_LEND:
1367 from_mode = MM_MODE_INVALID;
1368 to_mode = MM_MODE_R | MM_MODE_W | MM_MODE_X | MM_MODE_UNOWNED;
1369 break;
1370
1371 case HF_MEMORY_SHARE:
1372 from_mode = MM_MODE_R | MM_MODE_W | MM_MODE_X | MM_MODE_SHARED;
1373 to_mode = MM_MODE_R | MM_MODE_W | MM_MODE_X | MM_MODE_UNOWNED |
1374 MM_MODE_SHARED;
1375 break;
1376
1377 default:
1378 /* The input is untrusted so might not be a valid value. */
1379 return -1;
1380 }
1381
1382 /*
1383 * Create a local pool so any freed memory can't be used by another
1384 * thread. This is to ensure the original mapping can be restored if any
1385 * stage of the process fails.
1386 */
1387 mpool_init_with_fallback(&local_page_pool, &api_page_pool);
1388
1389 sl_lock_both(&from->lock, &to->lock);
1390
1391 /*
1392 * Ensure that the memory range is mapped with the same mode so that
1393 * changes can be reverted if the process fails.
1394 */
1395 if (!mm_vm_get_mode(&from->ptable, begin, end, &orig_from_mode)) {
1396 goto fail;
1397 }
1398
1399 /*
1400 * Ensure the memory range is valid for the sender. If it isn't, the
1401 * sender has either shared it with another VM already or has no claim
1402 * to the memory.
1403 */
1404 if (orig_from_mode & MM_MODE_INVALID) {
1405 goto fail;
1406 }
1407
1408 /*
1409 * The sender must own the memory and have exclusive access to it in
1410 * order to share it. Alternatively, it is giving memory back to the
1411 * owning VM.
1412 */
1413 if (orig_from_mode & MM_MODE_UNOWNED) {
1414 int orig_to_mode;
1415
1416 if (share != HF_MEMORY_GIVE ||
1417 !mm_vm_get_mode(&to->ptable, begin, end, &orig_to_mode) ||
1418 orig_to_mode & MM_MODE_UNOWNED) {
1419 goto fail;
1420 }
1421 } else if (orig_from_mode & MM_MODE_SHARED) {
1422 goto fail;
1423 }
1424
1425 pa_begin = pa_from_ipa(begin);
1426 pa_end = pa_from_ipa(end);
1427
1428 /*
1429 * First update the mapping for the sender so there is not overlap with
1430 * the recipient.
1431 */
1432 if (!mm_vm_identity_map(&from->ptable, pa_begin, pa_end, from_mode,
1433 NULL, &local_page_pool)) {
1434 goto fail;
1435 }
1436
1437 /* Clear the memory so no VM or device can see the previous contents. */
1438 if (!api_clear_memory(pa_begin, pa_end, &local_page_pool)) {
1439 goto fail_return_to_sender;
1440 }
1441
1442 /* Complete the transfer by mapping the memory into the recipient. */
1443 if (!mm_vm_identity_map(&to->ptable, pa_begin, pa_end, to_mode, NULL,
1444 &local_page_pool)) {
1445 /* TODO: partial defrag of failed range. */
1446 /* Recover any memory consumed in failed mapping. */
1447 mm_vm_defrag(&from->ptable, &local_page_pool);
1448 goto fail_return_to_sender;
1449 }
1450
1451 ret = 0;
1452 goto out;
1453
1454fail_return_to_sender:
Andrew Scull7e8de322019-07-02 13:00:56 +01001455 CHECK(mm_vm_identity_map(&from->ptable, pa_begin, pa_end,
1456 orig_from_mode, NULL, &local_page_pool));
Andrew Scull6386f252018-12-06 13:29:10 +00001457
1458fail:
1459 ret = -1;
1460
1461out:
1462 sl_unlock(&from->lock);
1463 sl_unlock(&to->lock);
1464
1465 mpool_fini(&local_page_pool);
1466
1467 return ret;
1468}
Jose Marinhofc0b2b62019-06-06 11:18:45 +01001469
1470/** Returns the version of the implemented SPCI specification. */
1471int32_t api_spci_version(void)
1472{
1473 /*
1474 * Ensure that both major and minor revision representation occupies at
1475 * most 15 bits.
1476 */
1477 static_assert(0x8000 > SPCI_VERSION_MAJOR,
1478 "Major revision representation take more than 15 bits.");
1479 static_assert(0x10000 > SPCI_VERSION_MINOR,
1480 "Minor revision representation take more than 16 bits.");
1481
1482 return (SPCI_VERSION_MAJOR << SPCI_VERSION_MAJOR_OFFSET) |
1483 SPCI_VERSION_MINOR;
1484}