Training courses

Kernel and Embedded Linux

Bootlin training courses

Embedded Linux, kernel,
Yocto Project, Buildroot, real-time,
graphics, boot time, debugging...

Bootlin logo

Elixir Cross Referencer

/*	$NetBSD: t_convert_xmm_s87.c,v 1.1 2020/10/15 17:44:44 mgorny Exp $	*/

/*-
 * Copyright (c) 2020 The NetBSD Foundation, Inc.
 * All rights reserved.
 *
 * This code is derived from software contributed to The NetBSD Foundation
 * by Michał Górny for Moritz Systems Technology Company Sp. z o.o.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */
#include <sys/cdefs.h>
__RCSID("$NetBSD: t_convert_xmm_s87.c,v 1.1 2020/10/15 17:44:44 mgorny Exp $");

#include <sys/types.h>
#include <sys/param.h>
#include <sys/sysctl.h>
#include <x86/cpu.h>
#include <x86/cpu_extended_state.h>

#include <stdint.h>
#include <string.h>

#include <atf-c.h>

#include "arch/x86/x86/convert_xmm_s87.c"

static const struct fpaccfx ST_INPUTS[] = {
	{{0x8000000000000000, 0x4000}}, /* +2.0 */
	{{0x3f00000000000000, 0x0000}}, /* 1.654785e-4932 */
	{{0x0000000000000000, 0x0000}}, /* +0 */
	{{0x0000000000000000, 0x8000}}, /* -0 */
	{{0x8000000000000000, 0x7fff}}, /* +inf */
	{{0x8000000000000000, 0xffff}}, /* -inf */
	{{0xc000000000000000, 0xffff}}, /* nan */
	{{0x8000000000000000, 0xc000}}, /* -2.0 */
};
__CTASSERT(sizeof(*ST_INPUTS) == 16);

ATF_TC(fsave_fxsave_hw);
ATF_TC_HEAD(fsave_fxsave_hw, tc)
{
	atf_tc_set_md_var(tc, "descr",
	    "converting between FSAVE/FXSAVE comparing to actual results");
}

ATF_TC_BODY(fsave_fxsave_hw, tc)
{
	struct save87 fsave, fsave_conv;
	struct fxsave fxsave, fxsave_conv;
	int i, j;

	int mib[] = { CTL_MACHDEP, CPU_OSFXSR };
	int has_fxsave;
	size_t has_fxsave_size = sizeof(has_fxsave);
	if (sysctl(mib, __arraycount(mib), &has_fxsave, &has_fxsave_size,
	    NULL, 0) == -1 || !has_fxsave)
		atf_tc_skip("FXSAVE not supported");

	for (i = 1; i <= __arraycount(ST_INPUTS); i++) {
		unsigned long unused1, unused2;
		__asm__ __volatile__(
			"finit\n"
			".loadfp:\n\t"
			"fldt (%2)\n\t"
			"add $0x10, %2\n\t"
			"loop .loadfp\n\t"
			"fxsave %5\n\t"
			"fsave %4\n\t"
			: "=b"(unused1), "=c"(unused2)
			: "b"(ST_INPUTS), "c"(i), "m"(fsave), "m"(fxsave)
			: "st"
		);

		/* Self-assertion for working FSAVE/FXSAVE */
		ATF_REQUIRE_EQ(fsave.s87_cw, fxsave.fx_cw);
		ATF_REQUIRE_EQ(fsave.s87_sw, fxsave.fx_sw);

		/* Test process_xmm_to_s87() */
		process_xmm_to_s87(&fxsave, &fsave_conv);
		ATF_CHECK_EQ(fsave_conv.s87_cw, fsave.s87_cw);
		ATF_CHECK_EQ(fsave_conv.s87_sw, fsave.s87_sw);
		ATF_CHECK_EQ(fsave_conv.s87_tw, fsave.s87_tw);
		for (j = 0; j < i; j++) {
			ATF_CHECK_EQ(fsave_conv.s87_ac[j].f87_exp_sign,
			    fsave.s87_ac[j].f87_exp_sign);
			ATF_CHECK_EQ(fsave_conv.s87_ac[j].f87_mantissa,
			    fsave.s87_ac[j].f87_mantissa);
		}

		/* Test process_s87_to_xmm() */
		process_s87_to_xmm(&fsave, &fxsave_conv);
		ATF_CHECK_EQ(fxsave_conv.fx_cw, fxsave.fx_cw);
		ATF_CHECK_EQ(fxsave_conv.fx_sw, fxsave.fx_sw);
		ATF_CHECK_EQ(fxsave_conv.fx_tw, fxsave.fx_tw);
		for (j = 0; j < i; j++) {
			ATF_CHECK_EQ(fxsave_conv.fx_87_ac[j].r.f87_exp_sign,
			    fxsave.fx_87_ac[j].r.f87_exp_sign);
			ATF_CHECK_EQ(fxsave_conv.fx_87_ac[j].r.f87_mantissa,
			    fxsave.fx_87_ac[j].r.f87_mantissa);
		}
	}
}

struct s87_xmm_test_vector {
	uint16_t sw;
	uint16_t tw;
	uint8_t tw_abridged;
};

struct s87_xmm_test_vector FIXED_TEST_VECTORS[] = {
	{0x3800, 0x3fff, 0x80},
	{0x3000, 0x2fff, 0xc0},
	{0x2800, 0x27ff, 0xe0},
	{0x2000, 0x25ff, 0xf0},
	{0x1800, 0x25bf, 0xf8},
	{0x1000, 0x25af, 0xfc},
	{0x0800, 0x25ab, 0xfe},
	{0x0000, 0x25a8, 0xff},
};

ATF_TC(s87_to_xmm);
ATF_TC_HEAD(s87_to_xmm, tc)
{
	atf_tc_set_md_var(tc, "descr",
	    "converting from FSAVE to FXSAVE using fixed test vectors");
}

ATF_TC_BODY(s87_to_xmm, tc)
{
	struct save87 fsave;
	struct fxsave fxsave;
	int i, j;

	memset(&fsave, 0, sizeof(fsave));
	for (i = 0; i < __arraycount(ST_INPUTS); i++) {
		fsave.s87_sw = FIXED_TEST_VECTORS[i].sw;
		fsave.s87_tw = FIXED_TEST_VECTORS[i].tw;
		for (j = 0; j <= i; j++)
			fsave.s87_ac[i - j] = ST_INPUTS[j].r;

		process_s87_to_xmm(&fsave, &fxsave);
		ATF_CHECK_EQ(fxsave.fx_sw, FIXED_TEST_VECTORS[i].sw);
		ATF_CHECK_EQ(fxsave.fx_tw, FIXED_TEST_VECTORS[i].tw_abridged);
		for (j = 0; j < i; j++) {
			ATF_CHECK_EQ(fxsave.fx_87_ac[i - j].r.f87_exp_sign,
			    ST_INPUTS[j].r.f87_exp_sign);
			ATF_CHECK_EQ(fxsave.fx_87_ac[i - j].r.f87_mantissa,
			    ST_INPUTS[j].r.f87_mantissa);
		}
	}
}

ATF_TC(xmm_to_s87);
ATF_TC_HEAD(xmm_to_s87, tc)
{
	atf_tc_set_md_var(tc, "descr",
	    "converting from FSAVE to FXSAVE using fixed test vectors");
}

ATF_TC_BODY(xmm_to_s87, tc)
{
	struct save87 fsave;
	struct fxsave fxsave;
	int i, j;

	memset(&fxsave, 0, sizeof(fxsave));
	for (i = 0; i < __arraycount(ST_INPUTS); i++) {
		fxsave.fx_sw = FIXED_TEST_VECTORS[i].sw;
		fxsave.fx_tw = FIXED_TEST_VECTORS[i].tw_abridged;
		for (j = 0; j <= i; j++)
			fxsave.fx_87_ac[i - j] = ST_INPUTS[j];

		process_xmm_to_s87(&fxsave, &fsave);
		ATF_CHECK_EQ(fsave.s87_sw, FIXED_TEST_VECTORS[i].sw);
		ATF_CHECK_EQ(fsave.s87_tw, FIXED_TEST_VECTORS[i].tw);
		for (j = 0; j < i; j++) {
			ATF_CHECK_EQ(fsave.s87_ac[i - j].f87_exp_sign,
			    ST_INPUTS[j].r.f87_exp_sign);
			ATF_CHECK_EQ(fsave.s87_ac[i - j].f87_mantissa,
			    ST_INPUTS[j].r.f87_mantissa);
		}
	}
}

ATF_TP_ADD_TCS(tp)
{
	ATF_TP_ADD_TC(tp, fsave_fxsave_hw);
	ATF_TP_ADD_TC(tp, s87_to_xmm);
	ATF_TP_ADD_TC(tp, xmm_to_s87);
	return atf_no_error();
}