diff --git a/sys/compat/linuxkpi/common/include/linux/compat.h b/sys/compat/linuxkpi/common/include/linux/compat.h
index d1a02f612f42..7922e884beb1 100644
--- a/sys/compat/linuxkpi/common/include/linux/compat.h
+++ b/sys/compat/linuxkpi/common/include/linux/compat.h
@@ -1,62 +1,68 @@
 /*-
  * Copyright (c) 2010 Isilon Systems, Inc.
  * Copyright (c) 2010 iX Systems, Inc.
  * Copyright (c) 2010 Panasas, Inc.
  * Copyright (c) 2013-2017 Mellanox Technologies, Ltd.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice unmodified, this list of conditions, and the following
  *    disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */
 #ifndef	_LINUXKPI_LINUX_COMPAT_H_
 #define	_LINUXKPI_LINUX_COMPAT_H_
 
 #include <sys/cdefs.h>
 #include <sys/types.h>
 #include <sys/proc.h>
 
+#if defined(__aarch64__) || defined(__arm__) || defined(__amd64__) || \
+    defined(__i386__) || defined(__powerpc64__)
+#define	LKPI_HAVE_FPU_CTX
+#endif
+
 struct domainset;
 struct thread;
 struct task_struct;
 
 extern int linux_alloc_current(struct thread *, int flags);
 extern void linux_free_current(struct task_struct *);
 extern struct domainset *linux_get_vm_domain_set(int node);
+extern int linux_set_fpu_ctx(struct task_struct *);
 
 static inline void
 linux_set_current(struct thread *td)
 {
 	if (__predict_false(td->td_lkpi_task == NULL))
 		lkpi_alloc_current(td, M_WAITOK);
 }
 
 static inline int
 linux_set_current_flags(struct thread *td, int flags)
 {
 	if (__predict_false(td->td_lkpi_task == NULL))
 		return (lkpi_alloc_current(td, flags));
 	return (0);
 }
 
 #define	compat_ptr(x)		((void *)(uintptr_t)x)
 #define	ptr_to_compat(x)	((uintptr_t)x)
 
 #endif	/* _LINUXKPI_LINUX_COMPAT_H_ */
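
The LKPI_HAVE_FPU_CTX block above centralizes the per-architecture test that
linux_fpu.c used to open-code, so any LinuxKPI consumer can key off a single
macro. A minimal sketch of the intended consumer pattern, assuming only what
this header exports (the macro and the linux_set_fpu_ctx() prototype); the
helper name is hypothetical and not part of the patch:

#include <linux/compat.h>	/* LKPI_HAVE_FPU_CTX, linux_set_fpu_ctx() */

#ifdef LKPI_HAVE_FPU_CTX
/* Hypothetical helper: ensure the task owns a kernel FPU context. */
static int
ensure_task_fpu_ctx(struct task_struct *task)
{
	/* linux_set_fpu_ctx() returns 0 on success, else ENOMEM. */
	return (linux_set_fpu_ctx(task));
}
#endif
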
diff --git a/sys/compat/linuxkpi/common/include/linux/sched.h b/sys/compat/linuxkpi/common/include/linux/sched.h
index 8cb6b12100d5..77c4f6d3f80f 100644
--- a/sys/compat/linuxkpi/common/include/linux/sched.h
+++ b/sys/compat/linuxkpi/common/include/linux/sched.h
@@ -1,242 +1,244 @@
 /*-
  * Copyright (c) 2010 Isilon Systems, Inc.
  * Copyright (c) 2010 iX Systems, Inc.
  * Copyright (c) 2010 Panasas, Inc.
  * Copyright (c) 2013-2018 Mellanox Technologies, Ltd.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice unmodified, this list of conditions, and the following
  *    disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */
 #ifndef	_LINUXKPI_LINUX_SCHED_H_
 #define	_LINUXKPI_LINUX_SCHED_H_
 
 #include <sys/cdefs.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/proc.h>
 #include <sys/rtprio.h>
 #include <sys/sched.h>
 #include <sys/sleepqueue.h>
 #include <sys/time.h>
 
 #include <linux/bitmap.h>
 #include <linux/compat.h>
 #include <linux/completion.h>
 #include <linux/hrtimer.h>
 #include <linux/mm_types.h>
 #include <linux/pid.h>
 #include <linux/slab.h>
 #include <linux/string.h>
 #include <linux/spinlock.h>
 #include <linux/time.h>
 
 #include <asm/atomic.h>
 
 #define	MAX_SCHEDULE_TIMEOUT	INT_MAX
 
 #define	TASK_RUNNING		0x0000
 #define	TASK_INTERRUPTIBLE	0x0001
 #define	TASK_UNINTERRUPTIBLE	0x0002
 #define	TASK_NORMAL		(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)
 #define	TASK_WAKING		0x0100
 #define	TASK_PARKED		0x0200
 
 #define	TASK_COMM_LEN		(MAXCOMLEN + 1)
 
 struct seq_file;
+struct fpu_kern_ctx;
 struct work_struct;
 
 struct task_struct {
 	struct thread *task_thread;
 	struct mm_struct *mm;
 	linux_task_fn_t *task_fn;
 	void   *task_data;
 	int	task_ret;
 	atomic_t usage;
 	atomic_t state;
 	atomic_t kthread_flags;
 	pid_t	pid;	/* BSD thread ID */
 	const char    *comm;
 	void   *bsd_ioctl_data;
 	unsigned bsd_ioctl_len;
 	struct completion parked;
 	struct completion exited;
 #define	TS_RCU_TYPE_MAX 2
 	TAILQ_ENTRY(task_struct) rcu_entry[TS_RCU_TYPE_MAX];
 	int rcu_recurse[TS_RCU_TYPE_MAX];
 	int bsd_interrupt_value;
 	struct work_struct *work;	/* current work struct, if set */
 	struct task_struct *group_leader;
 	unsigned rcu_section[TS_RCU_TYPE_MAX];
 	unsigned int fpu_ctx_level;
+	struct fpu_kern_ctx *fpu_ctx;
 };
 
 #define	current	({ \
 	struct thread *__td = curthread; \
 	linux_set_current(__td); \
 	((struct task_struct *)__td->td_lkpi_task); \
 })
 
 #define	task_pid_group_leader(task) (task)->task_thread->td_proc->p_pid
 #define	task_pid(task)		((task)->pid)
 #define	task_pid_nr(task)	((task)->pid)
 #define	task_pid_vnr(task)	((task)->pid)
 #define	get_pid(x)		(x)
 #define	put_pid(x)		do { } while (0)
 #define	current_euid()	(curthread->td_ucred->cr_uid)
 #define	task_euid(task)	((task)->task_thread->td_ucred->cr_uid)
 
 #define	get_task_state(task)		atomic_read(&(task)->state)
 #define	set_task_state(task, x)		atomic_set(&(task)->state, (x))
 #define	__set_task_state(task, x)	((task)->state.counter = (x))
 #define	set_current_state(x)		set_task_state(current, x)
 #define	__set_current_state(x)		__set_task_state(current, x)
 
 static inline void
 get_task_struct(struct task_struct *task)
 {
 	atomic_inc(&task->usage);
 }
 
 static inline void
 put_task_struct(struct task_struct *task)
 {
 	if (atomic_dec_and_test(&task->usage))
 		linux_free_current(task);
 }
 
 #define	cond_resched()	do { if (!cold) sched_relinquish(curthread); } while (0)
 
 #define	yield()		kern_yield(PRI_UNCHANGED)
 #define	sched_yield()	sched_relinquish(curthread)
 
 #define	need_resched()	(curthread->td_owepreempt || \
     td_ast_pending(curthread, TDA_SCHED))
 
 static inline int
 cond_resched_lock(spinlock_t *lock)
 {
 	if (need_resched() == 0)
 		return (0);
 	spin_unlock(lock);
 	cond_resched();
 	spin_lock(lock);
 	return (1);
 }
 
 bool linux_signal_pending(struct task_struct *task);
 bool linux_fatal_signal_pending(struct task_struct *task);
 bool linux_signal_pending_state(long state, struct task_struct *task);
 void linux_send_sig(int signo, struct task_struct *task);
 
 #define	signal_pending(task)		linux_signal_pending(task)
 #define	fatal_signal_pending(task)	linux_fatal_signal_pending(task)
 #define	signal_pending_state(state, task)		\
 	linux_signal_pending_state(state, task)
 #define	send_sig(signo, task, priv) do {		\
 	CTASSERT((priv) == 0);				\
 	linux_send_sig(signo, task);			\
 } while (0)
 
 int linux_schedule_timeout(int timeout);
 
 static inline void
 linux_schedule_save_interrupt_value(struct task_struct *task, int value)
 {
 	task->bsd_interrupt_value = value;
 }
 
 bool linux_task_exiting(struct task_struct *task);
 
 #define	current_exiting() \
 	linux_task_exiting(current)
 
 static inline int
 linux_schedule_get_interrupt_value(struct task_struct *task)
 {
 	int value = task->bsd_interrupt_value;
 	task->bsd_interrupt_value = 0;
 	return (value);
 }
 
 static inline void
 schedule(void)
 {
 	(void)linux_schedule_timeout(MAX_SCHEDULE_TIMEOUT);
 }
 
 #define	schedule_timeout(timeout)			\
 	linux_schedule_timeout(timeout)
 #define	schedule_timeout_killable(timeout)		\
 	schedule_timeout_interruptible(timeout)
 #define	schedule_timeout_interruptible(timeout) ({	\
 	set_current_state(TASK_INTERRUPTIBLE);		\
 	schedule_timeout(timeout);			\
 })
 #define	schedule_timeout_uninterruptible(timeout) ({	\
 	set_current_state(TASK_UNINTERRUPTIBLE);	\
 	schedule_timeout(timeout);			\
 })
 
 #define	io_schedule()			schedule()
 #define	io_schedule_timeout(timeout)	schedule_timeout(timeout)
 
 static inline uint64_t
 local_clock(void)
 {
 	struct timespec ts;
 
 	nanotime(&ts);
 	return ((uint64_t)ts.tv_sec * NSEC_PER_SEC + ts.tv_nsec);
 }
 
 static inline const char *
 get_task_comm(char *buf, struct task_struct *task)
 {
 	buf[0] = 0; /* buffer is too small */
 	return (task->comm);
 }
 
 static inline void
 sched_set_fifo(struct task_struct *t)
 {
 	struct rtprio rtp;
 
 	rtp.prio = (RTP_PRIO_MIN + RTP_PRIO_MAX) / 2;
 	rtp.type = RTP_PRIO_FIFO;
 	rtp_to_pri(&rtp, t->task_thread);
 }
 
 static inline void
 sched_set_fifo_low(struct task_struct *t)
 {
 	struct rtprio rtp;
 
 	rtp.prio = RTP_PRIO_MAX;	/* lowest priority */
 	rtp.type = RTP_PRIO_FIFO;
 	rtp_to_pri(&rtp, t->task_thread);
 }
 
 #endif	/* _LINUXKPI_LINUX_SCHED_H_ */
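
The forward declaration of struct fpu_kern_ctx keeps machine/fpu.h out of
this widely included header, and the new fpu_ctx pointer rides alongside the
existing fpu_ctx_level nesting counter. A lifetime sketch inferred from the
linux_current.c hunks that follow, not code from the patch itself:

/*
 * task allocated         -> ts->fpu_ctx == NULL (M_ZERO allocation)
 * first kernel-FPU use   -> linux_set_fpu_ctx() fills ts->fpu_ctx lazily
 * last put_task_struct() -> linux_free_current() -> fpu_kern_free_ctx()
 */
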
diff --git a/sys/compat/linuxkpi/common/src/linux_current.c b/sys/compat/linuxkpi/common/src/linux_current.c
index bec53384361f..668185094cbe 100644
--- a/sys/compat/linuxkpi/common/src/linux_current.c
+++ b/sys/compat/linuxkpi/common/src/linux_current.c
@@ -1,343 +1,361 @@
 /*-
  * Copyright (c) 2017 Hans Petter Selasky
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice unmodified, this list of conditions, and the following
  *    disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 #ifdef __amd64__
 #define	DEV_APIC
 #elif defined(__i386__)
 #include "opt_apic.h"
 #endif
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/eventhandler.h>
 #include <sys/malloc.h>
 #include <sys/sysctl.h>
 #include <sys/proc.h>
 
 #include <linux/compat.h>
 #include <linux/completion.h>
 #include <linux/mm.h>
 #include <linux/kthread.h>
 
+#ifdef LKPI_HAVE_FPU_CTX
+#include <machine/fpu.h>
+#endif
+
 #ifdef DEV_APIC
 extern u_int first_msi_irq, num_msi_irqs;
 #endif
 
 static eventhandler_tag linuxkpi_thread_dtor_tag;
 
 static uma_zone_t linux_current_zone;
 static uma_zone_t linux_mm_zone;
 
 /* check if another thread already has a mm_struct */
 static struct mm_struct *
 find_other_mm(struct proc *p)
 {
 	struct thread *td;
 	struct task_struct *ts;
 	struct mm_struct *mm;
 
 	PROC_LOCK_ASSERT(p, MA_OWNED);
 	FOREACH_THREAD_IN_PROC(p, td) {
 		ts = td->td_lkpi_task;
 		if (ts == NULL)
 			continue;
 		mm = ts->mm;
 		if (mm == NULL)
 			continue;
 		/* try to share other mm_struct */
 		if (atomic_inc_not_zero(&mm->mm_users))
 			return (mm);
 	}
 	return (NULL);
 }
 
 int
 linux_alloc_current(struct thread *td, int flags)
 {
 	struct proc *proc;
 	struct task_struct *ts;
 	struct mm_struct *mm, *mm_other;
 
 	MPASS(td->td_lkpi_task == NULL);
 
 	if ((td->td_pflags & TDP_ITHREAD) != 0 || !THREAD_CAN_SLEEP()) {
 		flags &= ~M_WAITOK;
 		flags |= M_NOWAIT | M_USE_RESERVE;
 	}
 
 	ts = uma_zalloc(linux_current_zone, flags | M_ZERO);
 	if (ts == NULL) {
 		if ((flags & (M_WAITOK | M_NOWAIT)) == M_WAITOK)
 			panic("linux_alloc_current: failed to allocate task");
 		return (ENOMEM);
 	}
 	mm = NULL;
 
 	/* setup new task structure */
 	atomic_set(&ts->kthread_flags, 0);
 	ts->task_thread = td;
 	ts->comm = td->td_name;
 	ts->pid = td->td_tid;
 	ts->group_leader = ts;
 	atomic_set(&ts->usage, 1);
 	atomic_set(&ts->state, TASK_RUNNING);
 	init_completion(&ts->parked);
 	init_completion(&ts->exited);
 
 	proc = td->td_proc;
 
 	PROC_LOCK(proc);
 	mm_other = find_other_mm(proc);
 
 	/* use allocated mm_struct as a fallback */
 	if (mm_other == NULL) {
 		PROC_UNLOCK(proc);
 		mm = uma_zalloc(linux_mm_zone, flags | M_ZERO);
 		if (mm == NULL) {
 			if ((flags & (M_WAITOK | M_NOWAIT)) == M_WAITOK)
 				panic(
 			    "linux_alloc_current: failed to allocate mm");
 			uma_zfree(linux_current_zone, ts);
 			return (ENOMEM);
 		}
 
 		PROC_LOCK(proc);
 		mm_other = find_other_mm(proc);
 		if (mm_other == NULL) {
 			/* setup new mm_struct */
 			init_rwsem(&mm->mmap_sem);
 			atomic_set(&mm->mm_count, 1);
 			atomic_set(&mm->mm_users, 1);
 			/* set mm_struct pointer */
 			ts->mm = mm;
 			/* clear pointer to not free memory */
 			mm = NULL;
 		} else {
 			ts->mm = mm_other;
 		}
 	} else {
 		ts->mm = mm_other;
 	}
 
 	/* store pointer to task struct */
 	td->td_lkpi_task = ts;
 	PROC_UNLOCK(proc);
 
 	/* free mm_struct pointer, if any */
 	uma_zfree(linux_mm_zone, mm);
 
 	return (0);
 }
 
+int
+linux_set_fpu_ctx(struct task_struct *task)
+{
+#ifdef LKPI_HAVE_FPU_CTX
+	if (task->fpu_ctx == NULL && curthread->td_critnest == 0)
+		task->fpu_ctx = fpu_kern_alloc_ctx(FPU_KERN_NOWAIT);
+#endif
+	return (task->fpu_ctx != NULL ? 0 : ENOMEM);
+}
+
 struct mm_struct *
 linux_get_task_mm(struct task_struct *task)
 {
 	struct mm_struct *mm;
 
 	mm = task->mm;
 	if (mm != NULL) {
 		atomic_inc(&mm->mm_users);
 		return (mm);
 	}
 	return (NULL);
 }
 
 void
 linux_mm_dtor(struct mm_struct *mm)
 {
 	uma_zfree(linux_mm_zone, mm);
 }
 
 void
 linux_free_current(struct task_struct *ts)
 {
 	mmput(ts->mm);
+#ifdef LKPI_HAVE_FPU_CTX
+	if (ts->fpu_ctx != NULL)
+		fpu_kern_free_ctx(ts->fpu_ctx);
+#endif
 	uma_zfree(linux_current_zone, ts);
 }
 
 static void
 linuxkpi_thread_dtor(void *arg __unused, struct thread *td)
 {
 	struct task_struct *ts;
 
 	ts = td->td_lkpi_task;
 	if (ts == NULL)
 		return;
 
 	td->td_lkpi_task = NULL;
 	put_task_struct(ts);
 }
 
 static struct task_struct *
 linux_get_pid_task_int(pid_t pid, const bool do_get)
 {
 	struct thread *td;
 	struct proc *p;
 	struct task_struct *ts;
 
 	if (pid > PID_MAX) {
 		/* try to find corresponding thread */
 		td = tdfind(pid, -1);
 		if (td != NULL) {
 			ts = td->td_lkpi_task;
 			if (do_get && ts != NULL)
 				get_task_struct(ts);
 			PROC_UNLOCK(td->td_proc);
 			return (ts);
 		}
 	} else {
 		/* try to find corresponding procedure */
 		p = pfind(pid);
 		if (p != NULL) {
 			FOREACH_THREAD_IN_PROC(p, td) {
 				ts = td->td_lkpi_task;
 				if (ts != NULL) {
 					if (do_get)
 						get_task_struct(ts);
 					PROC_UNLOCK(p);
 					return (ts);
 				}
 			}
 			PROC_UNLOCK(p);
 		}
 	}
 	return (NULL);
 }
 
 struct task_struct *
 linux_pid_task(pid_t pid)
 {
 	return (linux_get_pid_task_int(pid, false));
 }
 
 struct task_struct *
 linux_get_pid_task(pid_t pid)
 {
 	return (linux_get_pid_task_int(pid, true));
 }
 
 bool
 linux_task_exiting(struct task_struct *task)
 {
 	struct thread *td;
 	struct proc *p;
 	bool ret;
 
 	ret = false;
 
 	/* try to find corresponding thread */
 	td = tdfind(task->pid, -1);
 	if (td != NULL) {
 		p = td->td_proc;
 	} else {
 		/* try to find corresponding procedure */
 		p = pfind(task->pid);
 	}
 
 	if (p != NULL) {
 		if ((p->p_flag & P_WEXIT) != 0)
 			ret = true;
 		PROC_UNLOCK(p);
 	}
 	return (ret);
 }
 
 static int lkpi_task_resrv;
 SYSCTL_INT(_compat_linuxkpi, OID_AUTO, task_struct_reserve,
     CTLFLAG_RDTUN | CTLFLAG_NOFETCH, &lkpi_task_resrv, 0,
     "Number of struct task and struct mm to reserve for non-sleepable "
     "allocations");
 
 static void
 linux_current_init(void *arg __unused)
 {
 	TUNABLE_INT_FETCH("compat.linuxkpi.task_struct_reserve",
 	    &lkpi_task_resrv);
 	if (lkpi_task_resrv == 0) {
 #ifdef DEV_APIC
 		/*
 		 * Number of interrupt threads plus per-cpu callout
 		 * SWI threads.
 		 */
 		lkpi_task_resrv = first_msi_irq + num_msi_irqs + MAXCPU;
 #else
 		lkpi_task_resrv = 1024;		/* XXXKIB arbitrary */
 #endif
 	}
 	linux_current_zone = uma_zcreate("lkpicurr",
 	    sizeof(struct task_struct), NULL, NULL, NULL, NULL,
 	    UMA_ALIGN_PTR, 0);
 	uma_zone_reserve(linux_current_zone, lkpi_task_resrv);
 	uma_prealloc(linux_current_zone, lkpi_task_resrv);
 	linux_mm_zone = uma_zcreate("lkpimm", sizeof(struct mm_struct),
 	    NULL, NULL, NULL, NULL, UMA_ALIGN_PTR, 0);
 	uma_zone_reserve(linux_mm_zone, lkpi_task_resrv);
 	uma_prealloc(linux_mm_zone, lkpi_task_resrv);
 
 	atomic_thread_fence_seq_cst();
 
 	linuxkpi_thread_dtor_tag = EVENTHANDLER_REGISTER(thread_dtor,
 	    linuxkpi_thread_dtor, NULL, EVENTHANDLER_PRI_ANY);
 	lkpi_alloc_current = linux_alloc_current;
 }
 SYSINIT(linux_current, SI_SUB_EVENTHANDLER + 1, SI_ORDER_SECOND,
     linux_current_init, NULL);
 
 static void
 linux_current_uninit(void *arg __unused)
 {
 	struct proc *p;
 	struct task_struct *ts;
 	struct thread *td;
 
 	lkpi_alloc_current = linux_alloc_current_noop;
 
 	atomic_thread_fence_seq_cst();
 
 	sx_slock(&allproc_lock);
 	FOREACH_PROC_IN_SYSTEM(p) {
 		PROC_LOCK(p);
 		FOREACH_THREAD_IN_PROC(p, td) {
 			if ((ts = td->td_lkpi_task) != NULL) {
 				td->td_lkpi_task = NULL;
 				put_task_struct(ts);
 			}
 		}
 		PROC_UNLOCK(p);
 	}
 	sx_sunlock(&allproc_lock);
 
 	thread_reap_barrier();
 
 	EVENTHANDLER_DEREGISTER(thread_dtor, linuxkpi_thread_dtor_tag);
 
 	uma_zdestroy(linux_current_zone);
 	uma_zdestroy(linux_mm_zone);
 }
 SYSUNINIT(linux_current, SI_SUB_EVENTHANDLER + 1, SI_ORDER_SECOND,
     linux_current_uninit, NULL);
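
linux_set_fpu_ctx() above only attempts the allocation outside a critical
section (td_critnest == 0) and with FPU_KERN_NOWAIT, so it is safe to call on
the FPU-begin path without sleeping; a nonzero return means the caller must
fall back to a no-save section. A sketch of that calling convention, matching
what linux_fpu.c below actually does:

int err;

err = linux_set_fpu_ctx(current);
if (err == 0)
	/* current->fpu_ctx is valid; enter with a saved context. */
	fpu_kern_enter(curthread, current->fpu_ctx, FPU_KERN_KTHR);
else
	/* ENOMEM, or called inside a critical section: no-save fallback. */
	fpu_kern_enter(curthread, NULL, FPU_KERN_NOCTX);
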
diff --git a/sys/compat/linuxkpi/common/src/linux_fpu.c b/sys/compat/linuxkpi/common/src/linux_fpu.c
index b26dce98774b..d510bc208b88 100644
--- a/sys/compat/linuxkpi/common/src/linux_fpu.c
+++ b/sys/compat/linuxkpi/common/src/linux_fpu.c
@@ -1,73 +1,79 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause
  *
  * Copyright (c) 2020 Val Packett
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/types.h>
 #include <sys/systm.h>
 #include <sys/proc.h>
 #include <sys/kernel.h>
+#include <linux/compat.h>
 #include <linux/sched.h>
 #include <asm/fpu/api.h>
 
-#if defined(__aarch64__) || defined(__amd64__) || defined(__i386__)
+#ifdef LKPI_HAVE_FPU_CTX
 #include <machine/fpu.h>
 
 /*
  * Technically the Linux API isn't supposed to allow nesting sections
  * either, but currently used versions of GPU drivers rely on nesting
  * working, so we only enter the section on the outermost level.
  */
 
 void
 lkpi_kernel_fpu_begin(void)
 {
-	if ((current->fpu_ctx_level)++ == 0)
-		fpu_kern_enter(curthread, NULL, FPU_KERN_NOCTX);
+	int err;
+
+	if ((current->fpu_ctx_level)++ == 0) {
+		err = linux_set_fpu_ctx(current);
+		fpu_kern_enter(curthread, current->fpu_ctx,
+		    err == 0 ? FPU_KERN_KTHR : FPU_KERN_NOCTX);
+	}
 }
 
 void
 lkpi_kernel_fpu_end(void)
 {
 	if (--(current->fpu_ctx_level) == 0)
-		fpu_kern_leave(curthread, NULL);
+		fpu_kern_leave(curthread, current->fpu_ctx);
 }
 
 #else
 
 void
 lkpi_kernel_fpu_begin(void)
 {
 }
 
 void
 lkpi_kernel_fpu_end(void)
 {
 }
 
 #endif
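
For completeness, a consumer-side sketch. kernel_fpu_begin()/kernel_fpu_end()
are the Linux-facing wrappers that LinuxKPI's asm/fpu/api.h maps onto
lkpi_kernel_fpu_begin()/lkpi_kernel_fpu_end(); the driver function below is
illustrative only. As the comment in linux_fpu.c notes, sections may nest,
and only the outermost level actually enters and leaves the kernel FPU
region:

#include <asm/fpu/api.h>	/* kernel_fpu_begin()/kernel_fpu_end() */

/* Hypothetical driver path that executes SIMD instructions in the kernel. */
static void
example_simd_work(void)
{
	kernel_fpu_begin();	/* level 0 -> 1: fpu_kern_enter() */
	kernel_fpu_begin();	/* level 1 -> 2: bumps the counter only */
	/* ... FPU/SIMD usage is safe here ... */
	kernel_fpu_end();	/* level 2 -> 1: drops the counter only */
	kernel_fpu_end();	/* level 1 -> 0: fpu_kern_leave() */
}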