/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License (the "License"). * You may not use this file except in compliance with the License. * * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE * or http://www.opensolaris.org/os/licensing. * See the License for the specific language governing permissions * and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at usr/src/OPENSOLARIS.LICENSE. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END */ /* * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved. * Copyright (c) 2018, Joyent, Inc. */ /* * Floating point configuration. */ #include #include #include #include #include #include #include #include #define XMM_ALIGN 16 /* * See section 10.5.1 in the Intel 64 and IA-32 Architectures Software * Developer’s Manual, Volume 1. */ #define FXSAVE_ALIGN 16 /* * See section 13.4 in the Intel 64 and IA-32 Architectures Software * Developer’s Manual, Volume 1. */ #define XSAVE_ALIGN 64 /* * If fpu_exists is non-zero, fpu_probe will attempt to use any * hardware FPU (subject to other constraints, see below). If * fpu_exists is zero, fpu_probe will report that there is no * FPU even if there is one. */ int fpu_exists = 1; int fp_kind = FP_387; /* * The variable fpu_ignored is provided to allow other code to * determine whether emulation is being done because there is * no FPU or because of an override requested via /etc/system. */ int fpu_ignored = 0; /* * Used by ppcopy and ppzero to determine whether or not to use the * SSE-based pagecopy and pagezero routines */ int use_sse_pagecopy = 0; int use_sse_pagezero = 0; int use_sse_copy = 0; #if defined(__xpv) /* * Use of SSE or otherwise is forcibly configured for us by the hypervisor. */ #define ENABLE_SSE() #define DISABLE_SSE() #else /* __xpv */ #define ENABLE_SSE() setcr4(CR4_ENABLE_SSE_FLAGS(getcr4())) #define DISABLE_SSE() setcr4(CR4_DISABLE_SSE_FLAGS(getcr4())) #endif /* __xpv */ /* * Try and figure out what kind of FP capabilities we have, and * set up the control registers accordingly. */ void fpu_probe(void) { if (fpu_initial_probe() != 0) goto nofpu; if (fpu_exists == 0) { fpu_ignored = 1; goto nofpu; } #ifndef __xpv /* * Check and see if the fpu is present by looking * at the "extension type" bit. (While this used to * indicate a 387DX coprocessor in days gone by, * it's forced on by modern implementations for * compatibility.) */ if ((getcr0() & CR0_ET) == 0) goto nofpu; #endif /* Use the more complex exception clearing code if necessary */ if (cpuid_need_fp_excp_handling()) fpsave_ctxt = fpxsave_excp_clr_ctxt; /* * SSE and SSE2 are required for the 64-bit ABI. * * If they're not present, we can in principal run * 32-bit userland, though 64-bit processes will be hosed. * * (Perhaps we should complain more about this case!) */ if (is_x86_feature(x86_featureset, X86FSET_SSE) && is_x86_feature(x86_featureset, X86FSET_SSE2)) { fp_kind |= __FP_SSE; ENABLE_SSE(); if (is_x86_feature(x86_featureset, X86FSET_AVX)) { ASSERT(is_x86_feature(x86_featureset, X86FSET_XSAVE)); fp_kind |= __FP_AVX; } if (is_x86_feature(x86_featureset, X86FSET_XSAVE)) { fp_save_mech = FP_XSAVE; fp_elf = AT_386_FPINFO_XSAVE; if (is_x86_feature(x86_featureset, X86FSET_XSAVEOPT)) { /* * Use the more complex exception * clearing code if necessary. */ if (cpuid_need_fp_excp_handling()) { fpsave_ctxt = xsaveopt_excp_clr_ctxt; fp_elf = AT_386_FPINFO_XSAVE_AMD; } else { fpsave_ctxt = xsaveopt_ctxt; } xsavep = xsaveopt; } else { /* * Use the more complex exception * clearing code if necessary. */ if (cpuid_need_fp_excp_handling()) { fpsave_ctxt = xsave_excp_clr_ctxt; fp_elf = AT_386_FPINFO_XSAVE_AMD; } else { fpsave_ctxt = xsave_ctxt; } } fprestore_ctxt = xrestore_ctxt; fpsave_cachep = kmem_cache_create("xsave_cache", cpuid_get_xsave_size(), XSAVE_ALIGN, NULL, NULL, NULL, NULL, NULL, 0); } else { /* fp_save_mech defaults to FP_FXSAVE */ fpsave_cachep = kmem_cache_create("fxsave_cache", sizeof (struct fxsave_state), FXSAVE_ALIGN, NULL, NULL, NULL, NULL, NULL, 0); fp_elf = AT_386_FPINFO_FXSAVE; } } if (is_x86_feature(x86_featureset, X86FSET_SSE2)) { use_sse_pagecopy = use_sse_pagezero = use_sse_copy = 1; } if (fp_kind & __FP_SSE) { struct fxsave_state *fx; uint8_t fxsave_state[sizeof (struct fxsave_state) + XMM_ALIGN]; /* * Extract the mxcsr mask from our first fxsave */ fx = (void *)(((uintptr_t)(&fxsave_state[0]) + XMM_ALIGN) & ~(XMM_ALIGN - 1ul)); fx->fx_mxcsr_mask = 0; fxsave_insn(fx); if (fx->fx_mxcsr_mask != 0) { /* * Override default mask initialized in fpu.c */ sse_mxcsr_mask = fx->fx_mxcsr_mask; } } setcr0(CR0_ENABLE_FPU_FLAGS(getcr0())); return; /* * No FPU hardware present */ nofpu: setcr0(CR0_DISABLE_FPU_FLAGS(getcr0())); DISABLE_SSE(); fp_kind = FP_NO; fpu_exists = 0; }