/* * Copyright (c) 2010-2014 Wind River Systems, Inc. * * SPDX-License-Identifier: Apache-2.0 */ /** * @file * @brief Floating point register sharing routines * * This module allows multiple preemptible threads to safely share the system's * floating point registers, by allowing the system to save FPU state info * in a thread's stack region when a preemptive context switch occurs. * * Note: If the kernel has been built without floating point register sharing * support (CONFIG_FPU_SHARING), the floating point registers can still be used * safely by one or more cooperative threads OR by a single preemptive thread, * but not by both. * * This code is not necessary for systems with CONFIG_EAGER_FPU_SHARING, as * the floating point context is unconditionally saved/restored with every * context switch. * * The floating point register sharing mechanism is designed for minimal * intrusiveness. Floating point state saving is only performed for threads * that explicitly indicate they are using FPU registers, to avoid impacting * the stack size requirements of all other threads. Also, the SSE registers * are only saved for threads that actually used them. For those threads that * do require floating point state saving, a "lazy save/restore" mechanism * is employed so that the FPU's register sets are only switched in and out * when absolutely necessary; this avoids wasting effort preserving them when * there is no risk that they will be altered, or when there is no need to * preserve their contents. * * WARNING * The use of floating point instructions by ISRs is not supported by the * kernel. * * INTERNAL * The kernel sets CR0[TS] to 0 only for threads that require FP register * sharing. All other threads have CR0[TS] set to 1 so that an attempt * to perform an FP operation will cause an exception, allowing the kernel * to enable FP register sharing on its behalf. */ #include #include /* SSE control/status register default value (used by assembler code) */ extern uint32_t _sse_mxcsr_default_value; /** * @brief Disallow use of floating point capabilities * * This routine sets CR0[TS] to 1, which disallows the use of FP instructions * by the currently executing thread. */ static inline void z_FpAccessDisable(void) { void *tempReg; __asm__ volatile( "movl %%cr0, %0;\n\t" "orl $0x8, %0;\n\t" "movl %0, %%cr0;\n\t" : "=r"(tempReg) : : "memory"); } /** * @brief Save non-integer context information * * This routine saves the system's "live" non-integer context into the * specified area. If the specified thread supports SSE then * x87/MMX/SSEx thread info is saved, otherwise only x87/MMX thread is saved. * Function is invoked by FpCtxSave(struct k_thread *thread) */ static inline void z_do_fp_regs_save(void *preemp_float_reg) { __asm__ volatile("fnsave (%0);\n\t" : : "r"(preemp_float_reg) : "memory"); } /** * @brief Save non-integer context information * * This routine saves the system's "live" non-integer context into the * specified area. If the specified thread supports SSE then * x87/MMX/SSEx thread info is saved, otherwise only x87/MMX thread is saved. * Function is invoked by FpCtxSave(struct k_thread *thread) */ static inline void z_do_fp_and_sse_regs_save(void *preemp_float_reg) { __asm__ volatile("fxsave (%0);\n\t" : : "r"(preemp_float_reg) : "memory"); } /** * @brief Initialize floating point register context information. * * This routine initializes the system's "live" floating point registers. */ static inline void z_do_fp_regs_init(void) { __asm__ volatile("fninit\n\t"); } /** * @brief Initialize SSE register context information. * * This routine initializes the system's "live" SSE registers. */ static inline void z_do_sse_regs_init(void) { __asm__ volatile("ldmxcsr _sse_mxcsr_default_value\n\t"); } /* * Save a thread's floating point context information. * * This routine saves the system's "live" floating point context into the * specified thread control block. The SSE registers are saved only if the * thread is actually using them. */ static void FpCtxSave(struct k_thread *thread) { #ifdef CONFIG_X86_SSE if ((thread->base.user_options & K_SSE_REGS) != 0) { z_do_fp_and_sse_regs_save(&thread->arch.preempFloatReg); return; } #endif z_do_fp_regs_save(&thread->arch.preempFloatReg); } /* * Initialize a thread's floating point context information. * * This routine initializes the system's "live" floating point context. * The SSE registers are initialized only if the thread is actually using them. */ static inline void FpCtxInit(struct k_thread *thread) { z_do_fp_regs_init(); #ifdef CONFIG_X86_SSE if ((thread->base.user_options & K_SSE_REGS) != 0) { z_do_sse_regs_init(); } #endif } /* * Enable preservation of floating point context information. * * The transition from "non-FP supporting" to "FP supporting" must be done * atomically to avoid confusing the floating point logic used by z_swap(), so * this routine locks interrupts to ensure that a context switch does not occur. * The locking isn't really needed when the routine is called by a cooperative * thread (since context switching can't occur), but it is harmless. */ void z_float_enable(struct k_thread *thread, unsigned int options) { unsigned int imask; struct k_thread *fp_owner; if (!thread) { return; } /* Ensure a preemptive context switch does not occur */ imask = irq_lock(); /* Indicate thread requires floating point context saving */ thread->base.user_options |= (uint8_t)options; /* * The current thread might not allow FP instructions, so clear CR0[TS] * so we can use them. (CR0[TS] gets restored later on, if necessary.) */ __asm__ volatile("clts\n\t"); /* * Save existing floating point context (since it is about to change), * but only if the FPU is "owned" by an FP-capable task that is * currently handling an interrupt or exception (meaning its FP context * must be preserved). */ fp_owner = _kernel.current_fp; if (fp_owner != NULL) { if ((fp_owner->arch.flags & X86_THREAD_FLAG_ALL) != 0) { FpCtxSave(fp_owner); } } /* Now create a virgin FP context */ FpCtxInit(thread); /* Associate the new FP context with the specified thread */ if (thread == arch_current_thread()) { /* * When enabling FP support for the current thread, just claim * ownership of the FPU and leave CR0[TS] unset. * * (The FP context is "live" in hardware, not saved in TCS.) */ _kernel.current_fp = thread; } else { /* * When enabling FP support for someone else, assign ownership * of the FPU to them (unless we need it ourselves). */ if ((arch_current_thread()->base.user_options & _FP_USER_MASK) == 0) { /* * We are not FP-capable, so mark FPU as owned by the * thread we've just enabled FP support for, then * disable our own FP access by setting CR0[TS] back * to its original state. */ _kernel.current_fp = thread; z_FpAccessDisable(); } else { /* * We are FP-capable (and thus had FPU ownership on * entry), so save the new FP context in their TCS, * leave FPU ownership with self, and leave CR0[TS] * unset. * * The saved FP context is needed in case the thread * we enabled FP support for is currently pre-empted, * since z_swap() uses it to restore FP context when * the thread re-activates. * * Saving the FP context reinits the FPU, and thus * our own FP context, but that's OK since it didn't * need to be preserved. (i.e. We aren't currently * handling an interrupt or exception.) */ FpCtxSave(thread); } } irq_unlock(imask); } /** * Disable preservation of floating point context information. * * The transition from "FP supporting" to "non-FP supporting" must be done * atomically to avoid confusing the floating point logic used by z_swap(), so * this routine locks interrupts to ensure that a context switch does not occur. * The locking isn't really needed when the routine is called by a cooperative * thread (since context switching can't occur), but it is harmless. */ int z_float_disable(struct k_thread *thread) { unsigned int imask; /* Ensure a preemptive context switch does not occur */ imask = irq_lock(); /* Disable all floating point capabilities for the thread */ thread->base.user_options &= ~_FP_USER_MASK; if (thread == arch_current_thread()) { z_FpAccessDisable(); _kernel.current_fp = (struct k_thread *)0; } else { if (_kernel.current_fp == thread) { _kernel.current_fp = (struct k_thread *)0; } } irq_unlock(imask); return 0; } /* * Handler for "device not available" exception. * * This routine is registered to handle the "device not available" exception * (vector = 7). * * The processor will generate this exception if any x87 FPU, MMX, or SSEx * instruction is executed while CR0[TS]=1. The handler then enables the * current thread to use all supported floating point registers. */ void _FpNotAvailableExcHandler(struct arch_esf *pEsf) { ARG_UNUSED(pEsf); /* * Assume the exception did not occur in an ISR. * (In other words, CPU cycles will not be consumed to perform * error checking to ensure the exception was not generated in an ISR.) */ /* Enable highest level of FP capability configured into the kernel */ k_float_enable(arch_current_thread(), _FP_USER_MASK); } _EXCEPTION_CONNECT_NOCODE(_FpNotAvailableExcHandler, IV_DEVICE_NOT_AVAILABLE, 0);