Blame - main.c - hafnium/driver/linux - TrustedFirmware Git Browser

blob: b83840703a5f512b0944af2a7d89391eebdf7426 [file] [log] [blame]

Andrew Scull	0177811	2019-01-14 15:37:53 +0000	[diff] [blame]	1	// SPDX-License-Identifier: GPL-2.0-only
Andrew Walbran	13c3a0b	2018-11-30 11:51:53 +0000	[diff] [blame]	2	/*
Andrew Walbran	2bc0a32	2019-03-07 15:48:06 +0000	[diff] [blame]	3	* Copyright 2018 The Hafnium Authors.
Andrew Walbran	13c3a0b	2018-11-30 11:51:53 +0000	[diff] [blame]	4	*
				5	* This program is free software; you can redistribute it and/or
				6	* modify it under the terms of the GNU General Public License
				7	* version 2 as published by the Free Software Foundation.
				8	*
				9	* This program is distributed in the hope that it will be useful,
				10	* but WITHOUT ANY WARRANTY; without even the implied warranty of
				11	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
				12	* GNU General Public License for more details.
Andrew Walbran	13c3a0b	2018-11-30 11:51:53 +0000	[diff] [blame]	13	*/
				14
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	15	#include <clocksource/arm_arch_timer.h>
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	16	#include <linux/atomic.h>
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	17	#include <linux/cpuhotplug.h>
				18	#include <linux/hrtimer.h>
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	19	#include <linux/init.h>
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	20	#include <linux/interrupt.h>
				21	#include <linux/irq.h>
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	22	#include <linux/kernel.h>
				23	#include <linux/kthread.h>
Wedson Almeida Filho	f9e1192	2018-08-12 15:54:31 +0100	[diff] [blame]	24	#include <linux/mm.h>
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	25	#include <linux/module.h>
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	26	#include <linux/net.h>
				27	#include <linux/of.h>
				28	#include <linux/platform_device.h>
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	29	#include <linux/sched/task.h>
				30	#include <linux/slab.h>
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	31	#include <net/sock.h>
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	32
Andrew Scull	5570423	2018-08-10 17:19:54 +0100	[diff] [blame]	33	#include <hf/call.h>
Jose Marinho	1cc6c75	2019-03-11 16:28:03 +0000	[diff] [blame]	34	#include <hf/spci.h>
Fuad Tabba	3e669bc	2019-08-08 16:43:55 +0100	[diff] [blame]	35	#include <hf/transport.h>
Andrew Scull	5570423	2018-08-10 17:19:54 +0100	[diff] [blame]	36
Fuad Tabba	3e669bc	2019-08-08 16:43:55 +0100	[diff] [blame]	37	#include "uapi/hf/socket.h"
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	38
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	39	#define HYPERVISOR_TIMER_NAME "el2_timer"
				40
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	41	#define CONFIG_HAFNIUM_MAX_VMS 16
				42	#define CONFIG_HAFNIUM_MAX_VCPUS 32
				43
Fuad Tabba	5da4b6b	2019-08-05 13:56:20 +0100	[diff] [blame]	44	#define FIRST_SECONDARY_VM_ID (HF_VM_ID_OFFSET + 1)
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	45
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	46	struct hf_vcpu {
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	47	struct hf_vm *vm;
Andrew Walbran	ddc3394	2019-06-25 18:32:02 +0100	[diff] [blame]	48	spci_vcpu_index_t vcpu_index;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	49	struct task_struct *task;
Wedson Almeida Filho	7fe6233	2018-12-15 03:09:57 +0000	[diff] [blame]	50	atomic_t abort_sleep;
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	51	atomic_t waiting_for_message;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	52	struct hrtimer timer;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	53	};
				54
				55	struct hf_vm {
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	56	spci_vm_id_t id;
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	57	spci_vcpu_count_t vcpu_count;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	58	struct hf_vcpu *vcpu;
				59	};
				60
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	61	struct hf_sock {
				62	/* This needs to be the first field. */
				63	struct sock sk;
				64
				65	/*
				66	* The following fields are immutable after the socket transitions to
				67	* SS_CONNECTED state.
				68	*/
				69	uint64_t local_port;
				70	uint64_t remote_port;
				71	struct hf_vm *peer_vm;
				72	};
				73
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	74	static struct proto hf_sock_proto = {
				75	.name = "hafnium",
				76	.owner = THIS_MODULE,
				77	.obj_size = sizeof(struct hf_sock),
				78	};
				79
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	80	static struct hf_vm *hf_vms;
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	81	static spci_vm_count_t hf_vm_count;
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	82	static struct page *hf_send_page;
				83	static struct page *hf_recv_page;
				84	static atomic64_t hf_next_port = ATOMIC64_INIT(0);
				85	static DEFINE_SPINLOCK(hf_send_lock);
				86	static DEFINE_HASHTABLE(hf_local_port_hash, 7);
				87	static DEFINE_SPINLOCK(hf_local_port_hash_lock);
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	88	static int hf_irq;
Andrew Walbran	8d55e50	2019-02-05 11:42:08 +0000	[diff] [blame]	89	static enum cpuhp_state hf_cpuhp_state;
Jose Marinho	1cc6c75	2019-03-11 16:28:03 +0000	[diff] [blame]	90	static spci_vm_id_t current_vm_id;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	91
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	92	/**
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	93	* Retrieves a VM from its ID, returning NULL if the VM doesn't exist.
				94	*/
Andrew Walbran	01390ae	2019-06-19 11:32:46 +0100	[diff] [blame]	95	static struct hf_vm *hf_vm_from_id(spci_vm_id_t vm_id)
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	96	{
				97	if (vm_id < FIRST_SECONDARY_VM_ID \|\|
				98	vm_id >= FIRST_SECONDARY_VM_ID + hf_vm_count)
				99	return NULL;
				100
				101	return &hf_vms[vm_id - FIRST_SECONDARY_VM_ID];
				102	}
				103
				104	/**
Wedson Almeida Filho	7fe6233	2018-12-15 03:09:57 +0000	[diff] [blame]	105	* Wakes up the kernel thread responsible for running the given vcpu.
				106	*
				107	* Returns 0 if the thread was already running, 1 otherwise.
				108	*/
				109	static int hf_vcpu_wake_up(struct hf_vcpu *vcpu)
				110	{
				111	/* Set a flag indicating that the thread should not go to sleep. */
				112	atomic_set(&vcpu->abort_sleep, 1);
				113
				114	/* Set the thread to running state. */
				115	return wake_up_process(vcpu->task);
				116	}
				117
				118	/**
				119	* Puts the current thread to sleep. The current thread must be responsible for
				120	* running the given vcpu.
				121	*
				122	* Going to sleep will fail if hf_vcpu_wake_up() or kthread_stop() was called on
				123	* this vcpu/thread since the last time it [re]started running.
				124	*/
				125	static void hf_vcpu_sleep(struct hf_vcpu *vcpu)
				126	{
				127	int abort;
				128
				129	set_current_state(TASK_INTERRUPTIBLE);
				130
				131	/* Check the sleep-abort flag after making thread interruptible. */
				132	abort = atomic_read(&vcpu->abort_sleep);
				133	if (!abort && !kthread_should_stop())
				134	schedule();
				135
				136	/* Set state back to running on the way out. */
				137	set_current_state(TASK_RUNNING);
				138	}
				139
				140	/**
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	141	* Wakes up the thread associated with the vcpu that owns the given timer. This
				142	* is called when the timer the thread is waiting on expires.
				143	*/
				144	static enum hrtimer_restart hf_vcpu_timer_expired(struct hrtimer *timer)
				145	{
				146	struct hf_vcpu *vcpu = container_of(timer, struct hf_vcpu, timer);
Wedson Almeida Filho	7fe6233	2018-12-15 03:09:57 +0000	[diff] [blame]	147	/* TODO: Inject interrupt. */
				148	hf_vcpu_wake_up(vcpu);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	149	return HRTIMER_NORESTART;
				150	}
				151
				152	/**
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	153	* This function is called when Hafnium requests that the primary VM wake up a
				154	* vCPU that belongs to a secondary VM.
				155	*
				156	* It wakes up the thread if it's sleeping, or kicks it if it's already running.
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	157	*/
Andrew Walbran	ddc3394	2019-06-25 18:32:02 +0100	[diff] [blame]	158	static void hf_handle_wake_up_request(spci_vm_id_t vm_id,
				159	spci_vcpu_index_t vcpu)
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	160	{
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	161	struct hf_vm *vm = hf_vm_from_id(vm_id);
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	162
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	163	if (!vm) {
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	164	pr_warn("Request to wake up non-existent VM id: %u\n", vm_id);
				165	return;
				166	}
				167
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	168	if (vcpu >= vm->vcpu_count) {
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	169	pr_warn("Request to wake up non-existent vCPU: %u.%u\n",
				170	vm_id, vcpu);
				171	return;
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	172	}
				173
				174	if (hf_vcpu_wake_up(&vm->vcpu[vcpu]) == 0) {
				175	/*
				176	* The task was already running (presumably on a different
				177	* physical CPU); interrupt it. This gives Hafnium a chance to
				178	* inject any new interrupts.
				179	*/
				180	kick_process(vm->vcpu[vcpu].task);
				181	}
				182	}
				183
				184	/**
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	185	* Injects an interrupt into a vCPU of the VM and ensures the vCPU will run to
				186	* handle the interrupt.
				187	*/
Andrew Walbran	01390ae	2019-06-19 11:32:46 +0100	[diff] [blame]	188	static void hf_interrupt_vm(spci_vm_id_t vm_id, uint64_t int_id)
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	189	{
				190	struct hf_vm *vm = hf_vm_from_id(vm_id);
Andrew Walbran	ddc3394	2019-06-25 18:32:02 +0100	[diff] [blame]	191	spci_vcpu_index_t vcpu;
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	192	int64_t ret;
				193
				194	if (!vm) {
				195	pr_warn("Request to wake up non-existent VM id: %u\n", vm_id);
				196	return;
				197	}
				198
				199	/*
				200	* TODO: For now we're picking the first vcpu to interrupt, but
				201	* we want to be smarter.
				202	*/
				203	vcpu = 0;
				204	ret = hf_interrupt_inject(vm_id, vcpu, int_id);
				205
				206	if (ret == -1) {
				207	pr_warn("Failed to inject interrupt %lld to vCPU %d of VM %d",
				208	int_id, vcpu, vm_id);
				209	return;
				210	}
				211
				212	if (ret != 1) {
				213	/* We don't need to wake up the vcpu. */
				214	return;
				215	}
				216
				217	hf_handle_wake_up_request(vm_id, vcpu);
				218	}
				219
				220	/**
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	221	* Notify all waiters on the given VM.
				222	*/
Andrew Walbran	01390ae	2019-06-19 11:32:46 +0100	[diff] [blame]	223	static void hf_notify_waiters(spci_vm_id_t vm_id)
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	224	{
Andrew Walbran	01390ae	2019-06-19 11:32:46 +0100	[diff] [blame]	225	spci_vm_id_t waiter_vm_id;
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	226
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	227	while ((waiter_vm_id = hf_mailbox_waiter_get(vm_id)) != -1) {
				228	if (waiter_vm_id == HF_PRIMARY_VM_ID) {
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	229	/*
				230	* TODO: Use this information when implementing per-vm
				231	* queues.
				232	*/
				233	} else {
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	234	hf_interrupt_vm(waiter_vm_id,
				235	HF_MAILBOX_WRITABLE_INTID);
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	236	}
				237	}
				238	}
				239
				240	/**
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	241	* Delivers a message to a VM.
				242	*/
Andrew Walbran	01390ae	2019-06-19 11:32:46 +0100	[diff] [blame]	243	static void hf_deliver_message(spci_vm_id_t vm_id)
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	244	{
				245	struct hf_vm *vm = hf_vm_from_id(vm_id);
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	246	spci_vcpu_index_t i;
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	247
				248	if (!vm) {
				249	pr_warn("Tried to deliver message to non-existent VM id: %u\n",
				250	vm_id);
				251	return;
				252	}
				253
				254	/* Try to wake a vCPU that is waiting for a message. */
				255	for (i = 0; i < vm->vcpu_count; i++) {
				256	if (atomic_read(&vm->vcpu[i].waiting_for_message)) {
				257	hf_handle_wake_up_request(vm->id,
				258	vm->vcpu[i].vcpu_index);
				259	return;
				260	}
				261	}
				262
				263	/* None were waiting for a message so interrupt one. */
				264	hf_interrupt_vm(vm->id, HF_MAILBOX_READABLE_INTID);
				265	}
				266
				267	/**
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	268	* Handles a message delivered to this VM by validating that it's well-formed
				269	* and then queueing it for delivery to the appropriate socket.
				270	*/
Andrew Walbran	b331fa9	2019-10-03 16:48:07 +0100	[diff] [blame]	271	static void hf_handle_message(struct hf_vm *sender, size_t len,
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	272	const void *message)
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	273	{
				274	struct hf_sock *hsock;
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	275	const struct hf_msg_hdr hdr = (struct hf_msg_hdr )message;
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	276	struct sk_buff *skb;
				277	int err;
				278
				279	/* Ignore messages that are too small to hold a header. */
Marc Bonnici	39fdefd	2019-11-08 15:05:07 +0000	[diff] [blame^]	280	if (len < sizeof(struct hf_msg_hdr)) {
				281	pr_err("Message received without header of length %d\n", len);
				282	spci_rx_release();
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	283	return;
Marc Bonnici	39fdefd	2019-11-08 15:05:07 +0000	[diff] [blame^]	284	}
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	285
				286	len -= sizeof(struct hf_msg_hdr);
				287
				288	/* Go through the colliding sockets. */
				289	rcu_read_lock();
				290	hash_for_each_possible_rcu(hf_local_port_hash, hsock, sk.sk_node,
				291	hdr->dst_port) {
				292	if (hsock->peer_vm == sender &&
				293	hsock->remote_port == hdr->src_port) {
				294	sock_hold(&hsock->sk);
				295	break;
				296	}
				297	}
				298	rcu_read_unlock();
				299
				300	/* Nothing to do if we couldn't find the target. */
Marc Bonnici	39fdefd	2019-11-08 15:05:07 +0000	[diff] [blame^]	301	if (!hsock) {
				302	spci_rx_release();
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	303	return;
Marc Bonnici	39fdefd	2019-11-08 15:05:07 +0000	[diff] [blame^]	304	}
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	305
				306	/*
				307	* TODO: From this point on, there are two failure paths: when we
				308	* create the skb below, and when we enqueue it to the socket. What
				309	* should we do if they fail? Ideally we would have some form of flow
				310	* control to prevent message loss, but how to do it efficiently?
				311	*
				312	* One option is to have a pre-allocated message that indicates to the
				313	* sender that a message was dropped. This way we guarantee that the
				314	* sender will be aware of loss and should back-off.
				315	*/
				316	/* Create the skb. */
				317	skb = alloc_skb(len, GFP_KERNEL);
				318	if (!skb)
				319	goto exit;
				320
				321	memcpy(skb_put(skb, len), hdr + 1, len);
				322
				323	/*
				324	* Add the skb to the receive queue of the target socket. On success it
				325	* calls sk->sk_data_ready, which is currently set to sock_def_readable,
				326	* which wakes up any waiters.
				327	*/
				328	err = sock_queue_rcv_skb(&hsock->sk, skb);
				329	if (err)
				330	kfree_skb(skb);
				331
				332	exit:
				333	sock_put(&hsock->sk);
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	334
Andrew Walbran	73c3279	2019-11-05 13:09:23 +0000	[diff] [blame]	335	if (spci_rx_release().func == SPCI_RX_RELEASE_32)
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	336	hf_notify_waiters(HF_PRIMARY_VM_ID);
Andrew Scull	df6478f	2019-02-19 17:52:08 +0000	[diff] [blame]	337	}
				338
				339	/**
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	340	* This is the main loop of each vcpu.
				341	*/
				342	static int hf_vcpu_thread(void *data)
				343	{
				344	struct hf_vcpu *vcpu = data;
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	345	struct spci_value ret;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	346
				347	hrtimer_init(&vcpu->timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
				348	vcpu->timer.function = &hf_vcpu_timer_expired;
				349
				350	while (!kthread_should_stop()) {
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	351	spci_vcpu_index_t i;
Andrew Scull	01f83de	2019-01-23 13:41:47 +0000	[diff] [blame]	352
Wedson Almeida Filho	7fe6233	2018-12-15 03:09:57 +0000	[diff] [blame]	353	/*
				354	* We're about to run the vcpu, so we can reset the abort-sleep
				355	* flag.
				356	*/
				357	atomic_set(&vcpu->abort_sleep, 0);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	358
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	359	/* Call into Hafnium to run vcpu. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	360	ret = spci_run(vcpu->vm->id, vcpu->vcpu_index);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	361
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	362	switch (ret.func) {
Andrew Scull	e05702e	2019-01-08 14:46:46 +0000	[diff] [blame]	363	/* Preempted. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	364	case SPCI_INTERRUPT_32:
Andrew Scull	e05702e	2019-01-08 14:46:46 +0000	[diff] [blame]	365	if (need_resched())
				366	schedule();
				367	break;
				368
				369	/* Yield. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	370	case SPCI_YIELD_32:
Andrew Scull	e05702e	2019-01-08 14:46:46 +0000	[diff] [blame]	371	if (!kthread_should_stop())
				372	schedule();
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	373	break;
				374
Andrew Scull	0177811	2019-01-14 15:37:53 +0000	[diff] [blame]	375	/* WFI. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	376	case HF_SPCI_RUN_WAIT_FOR_INTERRUPT:
				377	if (ret.arg2 != SPCI_SLEEP_INDEFINITE) {
				378	hrtimer_start(&vcpu->timer, ret.arg2,
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	379	HRTIMER_MODE_REL);
				380	}
Wedson Almeida Filho	7fe6233	2018-12-15 03:09:57 +0000	[diff] [blame]	381	hf_vcpu_sleep(vcpu);
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	382	hrtimer_cancel(&vcpu->timer);
				383	break;
				384
				385	/* Waiting for a message. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	386	case SPCI_MSG_WAIT_32:
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	387	atomic_set(&vcpu->waiting_for_message, 1);
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	388	if (ret.arg2 != SPCI_SLEEP_INDEFINITE) {
				389	hrtimer_start(&vcpu->timer, ret.arg2,
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	390	HRTIMER_MODE_REL);
				391	}
				392	hf_vcpu_sleep(vcpu);
				393	hrtimer_cancel(&vcpu->timer);
				394	atomic_set(&vcpu->waiting_for_message, 0);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	395	break;
				396
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	397	/* Wake up another vcpu. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	398	case HF_SPCI_RUN_WAKE_UP:
Andrew Walbran	6aef655	2019-11-05 11:18:10 +0000	[diff] [blame]	399	hf_handle_wake_up_request(spci_vm_id(ret),
				400	spci_vcpu_index(ret));
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	401	break;
Wedson Almeida Filho	f9e1192	2018-08-12 15:54:31 +0100	[diff] [blame]	402
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	403	/* Response available. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	404	case SPCI_MSG_SEND_32:
				405	if (spci_msg_send_receiver(ret) == HF_PRIMARY_VM_ID) {
				406	hf_handle_message(vcpu->vm,
				407	spci_msg_send_size(ret),
Andrew Scull	9470423	2019-04-01 12:36:37 +0100	[diff] [blame]	408	page_address(hf_recv_page));
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	409	} else {
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	410	hf_deliver_message(spci_msg_send_receiver(ret));
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	411	}
Andrew Scull	dc8cab5	2018-10-10 18:29:39 +0100	[diff] [blame]	412	break;
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	413
				414	/* Notify all waiters. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	415	case SPCI_RX_RELEASE_32:
Wedson Almeida Filho	cd9fef9	2019-01-11 21:24:08 +0000	[diff] [blame]	416	hf_notify_waiters(vcpu->vm->id);
				417	break;
Andrew Scull	01f83de	2019-01-23 13:41:47 +0000	[diff] [blame]	418
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	419	/* Abort was triggered. */
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	420	case SPCI_ERROR_32:
Andrew Walbran	18f08a6	2019-11-13 11:57:52 +0000	[diff] [blame]	421	pr_warn("SPCI error %d running VM %d vCPU %d", ret.arg2,
				422	vcpu->vm->id, vcpu->vcpu_index);
Andrew Walbran	39bf789	2019-11-01 14:14:47 +0000	[diff] [blame]	423	switch (ret.arg2) {
				424	case SPCI_ABORTED:
				425	for (i = 0; i < vcpu->vm->vcpu_count; i++) {
				426	if (i == vcpu->vcpu_index)
				427	continue;
				428	hf_handle_wake_up_request(vcpu->vm->id,
				429	i);
				430	}
				431	hf_vcpu_sleep(vcpu);
				432	break;
Andrew Scull	01f83de	2019-01-23 13:41:47 +0000	[diff] [blame]	433	}
Andrew Scull	01f83de	2019-01-23 13:41:47 +0000	[diff] [blame]	434	break;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	435	}
				436	}
				437
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	438	return 0;
				439	}
				440
				441	/**
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	442	* Converts a pointer to a struct sock into a pointer to a struct hf_sock. It
				443	* relies on the fact that the first field of hf_sock is a sock.
				444	*/
				445	static struct hf_sock hsock_from_sk(struct sock sk)
				446	{
				447	return (struct hf_sock *)sk;
				448	}
				449
				450	/**
				451	* This is called when the last reference to the outer socket is released. For
				452	* example, if it's a user-space socket, when the last file descriptor pointing
				453	* to this socket is closed.
				454	*
				455	* It begins cleaning up resources, though some can only be cleaned up after all
				456	* references to the underlying socket are released, which is handled by
				457	* hf_sock_destruct().
				458	*/
				459	static int hf_sock_release(struct socket *sock)
				460	{
				461	struct sock *sk = sock->sk;
				462	struct hf_sock *hsock = hsock_from_sk(sk);
				463	unsigned long flags;
				464
				465	if (!sk)
				466	return 0;
				467
				468	/* Shutdown for both send and receive. */
				469	lock_sock(sk);
				470	sk->sk_shutdown \|= RCV_SHUTDOWN \| SEND_SHUTDOWN;
				471	sk->sk_state_change(sk);
				472	release_sock(sk);
				473
				474	/* Remove from the hash table, so lookups from now on won't find it. */
				475	spin_lock_irqsave(&hf_local_port_hash_lock, flags);
				476	hash_del_rcu(&hsock->sk.sk_node);
				477	spin_unlock_irqrestore(&hf_local_port_hash_lock, flags);
				478
				479	/*
				480	* TODO: When we implement a tx queue, we need to clear it here so that
				481	* sk_wmem_alloc will not prevent sk from being freed (sk_free).
				482	*/
				483
				484	/*
				485	* Wait for in-flight lookups to finish. We need to do this here because
Wedson Almeida Filho	89d0e47	2019-01-03 19:18:39 +0000	[diff] [blame]	486	* in-flight lookups rely on the reference to the socket we're about to
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	487	* release.
				488	*/
				489	synchronize_rcu();
				490	sock_put(sk);
				491	sock->sk = NULL;
				492
				493	return 0;
				494	}
				495
				496	/**
				497	* This is called when there are no more references to the socket. It frees all
				498	* resources that haven't been freed during release.
				499	*/
				500	static void hf_sock_destruct(struct sock *sk)
				501	{
				502	/*
				503	* Clear the receive queue now that the handler cannot add any more
				504	* skbs to it.
				505	*/
				506	skb_queue_purge(&sk->sk_receive_queue);
				507	}
				508
				509	/**
				510	* Connects the Hafnium socket to the provided VM and port. After the socket is
				511	* connected, it can be used to exchange datagrams with the specified peer.
				512	*/
Andrew Scull	0177811	2019-01-14 15:37:53 +0000	[diff] [blame]	513	static int hf_sock_connect(struct socket sock, struct sockaddr saddr, int len,
				514	int connect_flags)
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	515	{
				516	struct sock *sk = sock->sk;
				517	struct hf_sock *hsock = hsock_from_sk(sk);
				518	struct hf_vm *vm;
Fuad Tabba	3e669bc	2019-08-08 16:43:55 +0100	[diff] [blame]	519	struct hf_sockaddr *addr;
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	520	int err;
				521	unsigned long flags;
				522
				523	/* Basic address validation. */
Fuad Tabba	3e669bc	2019-08-08 16:43:55 +0100	[diff] [blame]	524	if (len < sizeof(struct hf_sockaddr) \|\| saddr->sa_family != AF_HF)
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	525	return -EINVAL;
				526
Fuad Tabba	3e669bc	2019-08-08 16:43:55 +0100	[diff] [blame]	527	addr = (struct hf_sockaddr *)saddr;
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	528	vm = hf_vm_from_id(addr->vm_id);
				529	if (!vm)
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	530	return -ENETUNREACH;
				531
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	532	/*
				533	* TODO: Once we implement access control in Hafnium, check that the
				534	* caller is allowed to contact the specified VM. Return -ECONNREFUSED
				535	* if access is denied.
				536	*/
				537
				538	/* Take lock to make sure state doesn't change as we connect. */
				539	lock_sock(sk);
				540
				541	/* Only unconnected sockets are allowed to become connected. */
				542	if (sock->state != SS_UNCONNECTED) {
				543	err = -EISCONN;
				544	goto exit;
				545	}
				546
				547	hsock->local_port = atomic64_inc_return(&hf_next_port);
				548	hsock->remote_port = addr->port;
				549	hsock->peer_vm = vm;
				550
				551	sock->state = SS_CONNECTED;
				552
				553	/* Add socket to hash table now that it's fully initialised. */
				554	spin_lock_irqsave(&hf_local_port_hash_lock, flags);
				555	hash_add_rcu(hf_local_port_hash, &sk->sk_node, hsock->local_port);
				556	spin_unlock_irqrestore(&hf_local_port_hash_lock, flags);
				557
				558	err = 0;
				559	exit:
				560	release_sock(sk);
				561	return err;
				562	}
				563
				564	/**
				565	* Sends the given skb to the appropriate VM by calling Hafnium. It will also
				566	* trigger the wake up of a recipient VM.
				567	*
				568	* Takes ownership of the skb on success.
				569	*/
				570	static int hf_send_skb(struct sk_buff *skb)
				571	{
				572	unsigned long flags;
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	573	struct spci_value ret;
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	574	struct hf_sock *hsock = hsock_from_sk(skb->sk);
				575	struct hf_vm *vm = hsock->peer_vm;
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	576	void *message = page_address(hf_send_page);
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	577
				578	/*
				579	* Call Hafnium under the send lock so that we serialize the use of the
				580	* global send buffer.
				581	*/
				582	spin_lock_irqsave(&hf_send_lock, flags);
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	583	memcpy(message, skb->data, skb->len);
Jose Marinho	1cc6c75	2019-03-11 16:28:03 +0000	[diff] [blame]	584
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	585	ret = spci_msg_send(current_vm_id, vm->id, skb->len, 0);
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	586	spin_unlock_irqrestore(&hf_send_lock, flags);
				587
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	588	if (ret.func == SPCI_ERROR_32) {
Andrew Walbran	b040b30	2019-10-10 13:50:06 +0100	[diff] [blame]	589	switch (ret.arg2) {
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	590	case SPCI_INVALID_PARAMETERS:
				591	return -ENXIO;
				592	case SPCI_NOT_SUPPORTED:
				593	return -EIO;
				594	case SPCI_DENIED:
				595	case SPCI_BUSY:
				596	default:
				597	return -EAGAIN;
				598	}
				599	}
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	600
Andrew Scull	71f5736	2019-02-05 16:11:35 +0000	[diff] [blame]	601	/* Ensure the VM will run to pick up the message. */
				602	hf_deliver_message(vm->id);
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	603
				604	kfree_skb(skb);
				605
				606	return 0;
				607	}
				608
				609	/**
				610	* Determines if the given socket is in the connected state. It acquires and
				611	* releases the socket lock.
				612	*/
				613	static bool hf_sock_is_connected(struct socket *sock)
				614	{
				615	bool ret;
				616
				617	lock_sock(sock->sk);
				618	ret = sock->state == SS_CONNECTED;
				619	release_sock(sock->sk);
				620
				621	return ret;
				622	}
				623
				624	/**
				625	* Sends a message to the VM & port the socket is connected to. All variants
				626	* of write/send/sendto/sendmsg eventually call this function.
				627	*/
				628	static int hf_sock_sendmsg(struct socket sock, struct msghdr m, size_t len)
				629	{
				630	struct sock *sk = sock->sk;
				631	struct sk_buff *skb;
				632	int err;
				633	struct hf_msg_hdr *hdr;
				634	struct hf_sock *hsock = hsock_from_sk(sk);
Andrew Walbran	cafe017	2019-10-07 14:14:05 +0100	[diff] [blame]	635	size_t payload_max_len = HF_MAILBOX_SIZE - sizeof(struct hf_msg_hdr);
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	636
				637	/* Check length. */
Andrew Scull	614ed7f	2019-04-01 12:12:38 +0100	[diff] [blame]	638	if (len > payload_max_len)
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	639	return -EMSGSIZE;
				640
				641	/* We don't allow the destination address to be specified. */
				642	if (m->msg_namelen > 0)
				643	return -EISCONN;
				644
				645	/* We don't support out of band messages. */
				646	if (m->msg_flags & MSG_OOB)
				647	return -EOPNOTSUPP;
				648
				649	/*
				650	* Ensure that the socket is connected. We don't need to hold the socket
				651	* lock (acquired and released by hf_sock_is_connected) for the
				652	* remainder of the function because the fields we care about are
				653	* immutable once the state is SS_CONNECTED.
				654	*/
				655	if (!hf_sock_is_connected(sock))
				656	return -ENOTCONN;
				657
				658	/*
				659	* Allocate an skb for this write. If there isn't enough room in the
				660	* socket's send buffer (sk_wmem_alloc >= sk_sndbuf), this will block
				661	* (if it's a blocking call). On success, it increments sk_wmem_alloc
				662	* and sets up the skb such that sk_wmem_alloc gets decremented when
				663	* the skb is freed (sock_wfree gets called).
				664	*/
				665	skb = sock_alloc_send_skb(sk, len + sizeof(struct hf_msg_hdr),
				666	m->msg_flags & MSG_DONTWAIT, &err);
				667	if (!skb)
				668	return err;
				669
				670	/* Reserve room for the header and initialise it. */
				671	skb_reserve(skb, sizeof(struct hf_msg_hdr));
				672	hdr = skb_push(skb, sizeof(struct hf_msg_hdr));
				673	hdr->src_port = hsock->local_port;
				674	hdr->dst_port = hsock->remote_port;
				675
				676	/* Allocate area for the contents, then copy into skb. */
				677	if (!copy_from_iter_full(skb_put(skb, len), len, &m->msg_iter)) {
				678	err = -EFAULT;
				679	goto err_cleanup;
				680	}
				681
				682	/*
				683	* TODO: We currently do this inline, but when we have support for
				684	* readiness notification from Hafnium, we must add this to a per-VM tx
				685	* queue that can make progress when the VM becomes writable. This will
				686	* fix send buffering and poll readiness notification.
				687	*/
				688	err = hf_send_skb(skb);
				689	if (err)
				690	goto err_cleanup;
				691
				692	return 0;
				693
				694	err_cleanup:
				695	kfree_skb(skb);
				696	return err;
				697	}
				698
				699	/**
				700	* Receives a message originated from the VM & port the socket is connected to.
				701	* All variants of read/recv/recvfrom/recvmsg eventually call this function.
				702	*/
				703	static int hf_sock_recvmsg(struct socket sock, struct msghdr m, size_t len,
				704	int flags)
				705	{
				706	struct sock *sk = sock->sk;
				707	struct sk_buff *skb;
				708	int err;
				709	size_t copy_len;
				710
				711	if (!hf_sock_is_connected(sock))
				712	return -ENOTCONN;
				713
				714	/* Grab the next skb from the receive queue. */
				715	skb = skb_recv_datagram(sk, flags, flags & MSG_DONTWAIT, &err);
				716	if (!skb)
				717	return err;
				718
				719	/* Make sure we don't copy more than what fits in the output buffer. */
				720	copy_len = skb->len;
				721	if (copy_len > len) {
				722	copy_len = len;
				723	m->msg_flags \|= MSG_TRUNC;
				724	}
				725
				726	/* Make sure we don't overflow the return value type. */
				727	if (copy_len > INT_MAX) {
				728	copy_len = INT_MAX;
				729	m->msg_flags \|= MSG_TRUNC;
				730	}
				731
				732	/* Copy skb to output iterator, then free it. */
				733	err = skb_copy_datagram_msg(skb, 0, m, copy_len);
				734	skb_free_datagram(sk, skb);
				735	if (err)
				736	return err;
				737
				738	return copy_len;
				739	}
				740
				741	/**
				742	* This function is called when a Hafnium socket is created. It initialises all
				743	* state such that the caller will be able to connect the socket and then send
				744	* and receive messages through it.
				745	*/
				746	static int hf_sock_create(struct net net, struct socket sock, int protocol,
Andrew Scull	0177811	2019-01-14 15:37:53 +0000	[diff] [blame]	747	int kern)
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	748	{
				749	static const struct proto_ops ops = {
				750	.family = PF_HF,
				751	.owner = THIS_MODULE,
				752	.release = hf_sock_release,
				753	.bind = sock_no_bind,
				754	.connect = hf_sock_connect,
				755	.socketpair = sock_no_socketpair,
				756	.accept = sock_no_accept,
				757	.ioctl = sock_no_ioctl,
				758	.listen = sock_no_listen,
				759	.shutdown = sock_no_shutdown,
				760	.setsockopt = sock_no_setsockopt,
				761	.getsockopt = sock_no_getsockopt,
				762	.sendmsg = hf_sock_sendmsg,
				763	.recvmsg = hf_sock_recvmsg,
				764	.mmap = sock_no_mmap,
				765	.sendpage = sock_no_sendpage,
				766	.poll = datagram_poll,
				767	};
				768	struct sock *sk;
				769
				770	if (sock->type != SOCK_DGRAM)
				771	return -ESOCKTNOSUPPORT;
				772
				773	if (protocol != 0)
				774	return -EPROTONOSUPPORT;
				775
				776	/*
				777	* For now we only allow callers with sys admin capability to create
				778	* Hafnium sockets.
				779	*/
				780	if (!capable(CAP_SYS_ADMIN))
				781	return -EPERM;
				782
				783	/* Allocate and initialise socket. */
				784	sk = sk_alloc(net, PF_HF, GFP_KERNEL, &hf_sock_proto, kern);
				785	if (!sk)
				786	return -ENOMEM;
				787
				788	sock_init_data(sock, sk);
				789
				790	sk->sk_destruct = hf_sock_destruct;
				791	sock->ops = &ops;
				792	sock->state = SS_UNCONNECTED;
				793
				794	return 0;
				795	}
				796
				797	/**
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	798	* Frees all resources, including threads, associated with the Hafnium driver.
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	799	*/
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	800	static void hf_free_resources(void)
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	801	{
Fuad Tabba	5da4b6b	2019-08-05 13:56:20 +0100	[diff] [blame]	802	uint16_t i;
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	803	spci_vcpu_index_t j;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	804
				805	/*
				806	* First stop all worker threads. We need to do this before freeing
				807	* resources because workers may reference each other, so it is only
				808	* safe to free resources after they have all stopped.
				809	*/
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	810	for (i = 0; i < hf_vm_count; i++) {
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	811	struct hf_vm *vm = &hf_vms[i];
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	812
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	813	for (j = 0; j < vm->vcpu_count; j++)
				814	kthread_stop(vm->vcpu[j].task);
				815	}
				816
				817	/* Free resources. */
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	818	for (i = 0; i < hf_vm_count; i++) {
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	819	struct hf_vm *vm = &hf_vms[i];
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	820
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	821	for (j = 0; j < vm->vcpu_count; j++)
				822	put_task_struct(vm->vcpu[j].task);
				823	kfree(vm->vcpu);
				824	}
				825
				826	kfree(hf_vms);
				827	}
				828
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	829	/**
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	830	* Handles the hypervisor timer interrupt.
				831	*/
				832	static irqreturn_t hf_nop_irq_handler(int irq, void *dev)
				833	{
				834	/*
				835	* No need to do anything, the interrupt only exists to return to the
				836	* primary vCPU so that the virtual timer will be restored and fire as
				837	* normal.
				838	*/
				839	return IRQ_HANDLED;
				840	}
				841
				842	/**
				843	* Enables the hypervisor timer interrupt on a CPU, when it starts or after the
				844	* driver is first loaded.
				845	*/
				846	static int hf_starting_cpu(unsigned int cpu)
				847	{
				848	if (hf_irq != 0) {
				849	/* Enable the interrupt, and set it to be edge-triggered. */
				850	enable_percpu_irq(hf_irq, IRQ_TYPE_EDGE_RISING);
				851	}
Andrew Walbran	8d55e50	2019-02-05 11:42:08 +0000	[diff] [blame]	852
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	853	return 0;
				854	}
				855
				856	/**
				857	* Disables the hypervisor timer interrupt on a CPU when it is powered down.
				858	*/
				859	static int hf_dying_cpu(unsigned int cpu)
				860	{
				861	if (hf_irq != 0) {
				862	/* Disable the interrupt while the CPU is asleep. */
				863	disable_percpu_irq(hf_irq);
				864	}
				865
				866	return 0;
				867	}
				868
				869	/**
				870	* Registers for the hypervisor timer interrupt.
				871	*/
				872	static int hf_int_driver_probe(struct platform_device *pdev)
				873	{
				874	int irq;
				875	int ret;
				876
				877	/*
				878	* Register a handler for the hyperviser timer IRQ, as it is needed for
				879	* Hafnium to emulate the virtual timer for Linux while a secondary vCPU
				880	* is running.
				881	*/
				882	irq = platform_get_irq(pdev, ARCH_TIMER_HYP_PPI);
				883	if (irq < 0) {
				884	pr_err("Error getting hypervisor timer IRQ: %d\n", irq);
				885	return irq;
				886	}
				887	hf_irq = irq;
				888
				889	ret = request_percpu_irq(irq, hf_nop_irq_handler, HYPERVISOR_TIMER_NAME,
				890	pdev);
				891	if (ret != 0) {
				892	pr_err("Error registering hypervisor timer IRQ %d: %d\n",
				893	irq, ret);
				894	return ret;
				895	}
				896	pr_info("Hafnium registered for IRQ %d\n", irq);
				897	ret = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN,
				898	"hafnium/hypervisor_timer:starting",
				899	hf_starting_cpu, hf_dying_cpu);
				900	if (ret < 0) {
				901	pr_err("Error enabling timer on all CPUs: %d\n", ret);
Andrew Walbran	8d55e50	2019-02-05 11:42:08 +0000	[diff] [blame]	902	free_percpu_irq(irq, pdev);
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	903	return ret;
				904	}
Andrew Walbran	8d55e50	2019-02-05 11:42:08 +0000	[diff] [blame]	905	hf_cpuhp_state = ret;
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	906
				907	return 0;
				908	}
				909
				910	/**
				911	* Unregisters for the hypervisor timer interrupt.
				912	*/
				913	static int hf_int_driver_remove(struct platform_device *pdev)
				914	{
Andrew Walbran	8d55e50	2019-02-05 11:42:08 +0000	[diff] [blame]	915	/*
				916	* This will cause hf_dying_cpu to be called on each CPU, which will
				917	* disable the IRQs.
				918	*/
				919	cpuhp_remove_state(hf_cpuhp_state);
				920	free_percpu_irq(hf_irq, pdev);
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	921
				922	return 0;
				923	}
				924
				925	static const struct of_device_id hf_int_driver_id[] = {
				926	{.compatible = "arm,armv7-timer"},
				927	{.compatible = "arm,armv8-timer"},
				928	{}
				929	};
				930
				931	static struct platform_driver hf_int_driver = {
				932	.driver = {
				933	.name = HYPERVISOR_TIMER_NAME,
				934	.owner = THIS_MODULE,
				935	.of_match_table = of_match_ptr(hf_int_driver_id),
				936	},
				937	.probe = hf_int_driver_probe,
				938	.remove = hf_int_driver_remove,
				939	};
				940
				941	/**
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	942	* Initializes the Hafnium driver by creating a thread for each vCPU of each
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	943	* virtual machine.
				944	*/
				945	static int __init hf_init(void)
				946	{
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	947	static const struct net_proto_family proto_family = {
				948	.family = PF_HF,
				949	.create = hf_sock_create,
				950	.owner = THIS_MODULE,
				951	};
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	952	int64_t ret;
Andrew Walbran	2c6e751	2019-11-05 14:02:29 +0000	[diff] [blame]	953	struct spci_value spci_ret;
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	954	spci_vm_id_t i;
				955	spci_vcpu_index_t j;
				956	spci_vm_count_t secondary_vm_count;
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	957	uint32_t total_vcpu_count;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	958
Wedson Almeida Filho	f9e1192	2018-08-12 15:54:31 +0100	[diff] [blame]	959	/* Allocate a page for send and receive buffers. */
				960	hf_send_page = alloc_page(GFP_KERNEL);
				961	if (!hf_send_page) {
				962	pr_err("Unable to allocate send buffer\n");
				963	return -ENOMEM;
				964	}
				965
				966	hf_recv_page = alloc_page(GFP_KERNEL);
				967	if (!hf_recv_page) {
				968	__free_page(hf_send_page);
				969	pr_err("Unable to allocate receive buffer\n");
				970	return -ENOMEM;
				971	}
				972
				973	/*
				974	* Configure both addresses. Once configured, we cannot free these pages
				975	* because the hypervisor will use them, even if the module is
				976	* unloaded.
				977	*/
Andrew Walbran	2c6e751	2019-11-05 14:02:29 +0000	[diff] [blame]	978	spci_ret = spci_rxtx_map(page_to_phys(hf_send_page),
				979	page_to_phys(hf_recv_page));
				980	if (spci_ret.func != SPCI_SUCCESS_32) {
Wedson Almeida Filho	f9e1192	2018-08-12 15:54:31 +0100	[diff] [blame]	981	__free_page(hf_send_page);
				982	__free_page(hf_recv_page);
Wedson Almeida Filho	f9e1192	2018-08-12 15:54:31 +0100	[diff] [blame]	983	pr_err("Unable to configure VM\n");
Andrew Walbran	2c6e751	2019-11-05 14:02:29 +0000	[diff] [blame]	984	if (spci_ret.func == SPCI_ERROR_32)
				985	pr_err("SPCI error code %d\n", spci_ret.arg2);
				986	else
				987	pr_err("Unexpected SPCI function %#x\n", spci_ret.func);
Wedson Almeida Filho	f9e1192	2018-08-12 15:54:31 +0100	[diff] [blame]	988	return -EIO;
				989	}
				990
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	991	/* Get the number of secondary VMs. */
				992	secondary_vm_count = hf_vm_get_count() - 1;
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	993
				994	/* Confirm the maximum number of VMs looks sane. */
				995	BUILD_BUG_ON(CONFIG_HAFNIUM_MAX_VMS < 1);
				996	BUILD_BUG_ON(CONFIG_HAFNIUM_MAX_VMS > U16_MAX);
				997
				998	/* Validate the number of VMs. There must at least be the primary. */
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	999	if (secondary_vm_count > CONFIG_HAFNIUM_MAX_VMS - 1) {
Fuad Tabba	8523ccd	2019-07-31 15:37:29 +0100	[diff] [blame]	1000	pr_err("Number of VMs is out of range: %d\n",
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	1001	secondary_vm_count);
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1002	return -EDQUOT;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1003	}
				1004
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	1005	/* Only track the secondary VMs. */
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	1006	hf_vms = kmalloc_array(secondary_vm_count, sizeof(struct hf_vm),
				1007	GFP_KERNEL);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1008	if (!hf_vms)
				1009	return -ENOMEM;
				1010
Jose Marinho	1cc6c75	2019-03-11 16:28:03 +0000	[diff] [blame]	1011	/* Cache the VM id for later usage. */
				1012	current_vm_id = hf_vm_get_id();
				1013
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1014	/* Initialize each VM. */
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1015	total_vcpu_count = 0;
Andrew Walbran	4c96d0c	2019-06-25 18:32:56 +0100	[diff] [blame]	1016	for (i = 0; i < secondary_vm_count; i++) {
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	1017	struct hf_vm *vm = &hf_vms[i];
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	1018	spci_vcpu_count_t vcpu_count;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1019
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	1020	/* Adjust the ID as only the secondaries are tracked. */
Wedson Almeida Filho	ec84193	2019-01-22 23:07:50 +0000	[diff] [blame]	1021	vm->id = i + FIRST_SECONDARY_VM_ID;
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	1022
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	1023	vcpu_count = hf_vcpu_get_count(vm->id);
				1024	if (vcpu_count < 0) {
				1025	pr_err("HF_VCPU_GET_COUNT failed for vm=%u: %d",
				1026	vm->id, vcpu_count);
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1027	ret = -EIO;
				1028	goto fail_with_cleanup;
				1029	}
				1030
				1031	/* Avoid overflowing the vcpu count. */
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	1032	if (vcpu_count > (U32_MAX - total_vcpu_count)) {
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1033	pr_err("Too many vcpus: %u\n", total_vcpu_count);
				1034	ret = -EDQUOT;
				1035	goto fail_with_cleanup;
				1036	}
				1037
				1038	/* Confirm the maximum number of VCPUs looks sane. */
				1039	BUILD_BUG_ON(CONFIG_HAFNIUM_MAX_VCPUS < 1);
				1040	BUILD_BUG_ON(CONFIG_HAFNIUM_MAX_VCPUS > U16_MAX);
				1041
				1042	/* Enforce the limit on vcpus. */
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	1043	total_vcpu_count += vcpu_count;
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1044	if (total_vcpu_count > CONFIG_HAFNIUM_MAX_VCPUS) {
				1045	pr_err("Too many vcpus: %u\n", total_vcpu_count);
				1046	ret = -EDQUOT;
				1047	goto fail_with_cleanup;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1048	}
				1049
Andrew Walbran	3eeb1de	2019-06-25 18:32:30 +0100	[diff] [blame]	1050	vm->vcpu_count = vcpu_count;
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1051	vm->vcpu = kmalloc_array(vm->vcpu_count, sizeof(struct hf_vcpu),
				1052	GFP_KERNEL);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1053	if (!vm->vcpu) {
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1054	ret = -ENOMEM;
				1055	goto fail_with_cleanup;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1056	}
				1057
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1058	/* Update the number of initialized VMs. */
				1059	hf_vm_count = i + 1;
				1060
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1061	/* Create a kernel thread for each vcpu. */
				1062	for (j = 0; j < vm->vcpu_count; j++) {
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	1063	struct hf_vcpu *vcpu = &vm->vcpu[j];
Andrew Scull	0177811	2019-01-14 15:37:53 +0000	[diff] [blame]	1064
				1065	vcpu->task =
				1066	kthread_create(hf_vcpu_thread, vcpu,
				1067	"vcpu_thread_%u_%u", vm->id, j);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1068	if (IS_ERR(vcpu->task)) {
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1069	pr_err("Error creating task (vm=%u,vcpu=%u): %ld\n",
				1070	vm->id, j, PTR_ERR(vcpu->task));
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1071	vm->vcpu_count = j;
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1072	ret = PTR_ERR(vcpu->task);
				1073	goto fail_with_cleanup;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1074	}
				1075
				1076	get_task_struct(vcpu->task);
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	1077	vcpu->vm = vm;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1078	vcpu->vcpu_index = j;
Wedson Almeida Filho	7fe6233	2018-12-15 03:09:57 +0000	[diff] [blame]	1079	atomic_set(&vcpu->abort_sleep, 0);
Andrew Scull	ece5ef4	2019-05-08 15:07:25 +0100	[diff] [blame]	1080	atomic_set(&vcpu->waiting_for_message, 0);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1081	}
				1082	}
				1083
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1084	/* Register protocol and socket family. */
				1085	ret = proto_register(&hf_sock_proto, 0);
				1086	if (ret) {
				1087	pr_err("Unable to register protocol: %lld\n", ret);
				1088	goto fail_with_cleanup;
				1089	}
				1090
				1091	ret = sock_register(&proto_family);
				1092	if (ret) {
				1093	pr_err("Unable to register Hafnium's socket family: %lld\n",
				1094	ret);
				1095	goto fail_unregister_proto;
				1096	}
				1097
				1098	/*
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	1099	* Register as a driver for the timer device, so we can register a
				1100	* handler for the hyperviser timer IRQ.
				1101	*/
				1102	ret = platform_driver_register(&hf_int_driver);
				1103	if (ret != 0) {
				1104	pr_err("Error registering timer driver %lld\n", ret);
				1105	goto fail_unregister_socket;
				1106	}
				1107
				1108	/*
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1109	* Start running threads now that all is initialized.
				1110	*
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	1111	* Any failures from this point on must also unregister the driver with
				1112	* platform_driver_unregister().
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1113	*/
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1114	for (i = 0; i < hf_vm_count; i++) {
Andrew Scull	b3a61b5	2018-09-17 14:30:34 +0100	[diff] [blame]	1115	struct hf_vm *vm = &hf_vms[i];
Andrew Scull	0177811	2019-01-14 15:37:53 +0000	[diff] [blame]	1116
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1117	for (j = 0; j < vm->vcpu_count; j++)
				1118	wake_up_process(vm->vcpu[j].task);
				1119	}
				1120
				1121	/* Dump vm/vcpu count info. */
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	1122	pr_info("Hafnium successfully loaded with %u VMs:\n", hf_vm_count);
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	1123	for (i = 0; i < hf_vm_count; i++) {
				1124	struct hf_vm *vm = &hf_vms[i];
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1125
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	1126	pr_info("\tVM %u: %u vCPUS\n", vm->id, vm->vcpu_count);
Andrew Scull	b722f95	2018-09-27 15:39:10 +0100	[diff] [blame]	1127	}
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1128
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1129	return 0;
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1130
Andrew Walbran	b3ca1dc	2019-01-30 17:13:44 +0000	[diff] [blame]	1131	fail_unregister_socket:
				1132	sock_unregister(PF_HF);
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1133	fail_unregister_proto:
				1134	proto_unregister(&hf_sock_proto);
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1135	fail_with_cleanup:
				1136	hf_free_resources();
				1137	return ret;
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1138	}
				1139
				1140	/**
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	1141	* Frees up all resources used by the Hafnium driver in preparation for
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1142	* unloading it.
				1143	*/
				1144	static void __exit hf_exit(void)
				1145	{
Andrew Scull	bb7ae41	2018-09-28 21:07:15 +0100	[diff] [blame]	1146	pr_info("Preparing to unload Hafnium\n");
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1147	sock_unregister(PF_HF);
				1148	proto_unregister(&hf_sock_proto);
Andrew Scull	82257c4	2018-10-01 10:37:48 +0100	[diff] [blame]	1149	hf_free_resources();
Andrew Walbran	8d55e50	2019-02-05 11:42:08 +0000	[diff] [blame]	1150	platform_driver_unregister(&hf_int_driver);
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1151	pr_info("Hafnium ready to unload\n");
				1152	}
				1153
Wedson Almeida Filho	1ee3565	2018-12-24 01:36:48 +0000	[diff] [blame]	1154	MODULE_LICENSE("GPL v2");
Wedson Almeida Filho	2f62b42	2018-06-19 06:44:32 +0100	[diff] [blame]	1155
				1156	module_init(hf_init);
				1157	module_exit(hf_exit);