/* SPDX-License-Identifier: MIT * * Permission is hereby granted, free of charge, to any person * obtaining a copy of this software and associated documentation * files (the "Software"), to deal in the Software without * restriction, including without limitation the rights to use, copy, * modify, merge, publish, distribute, sublicense, and/or sell copies * of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be * included in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE * SOFTWARE. * * Copyright: * 2020 Evan Nemerson */ #define SIMDE_TEST_X86_AVX512_INSN storeu #include #include static int test_simde_mm512_storeu_ps (SIMDE_MUNIT_TEST_ARGS) { #if 1 static const struct { const simde_float32 a[16]; const simde_float32 r[16]; } test_vec[] = { { { SIMDE_FLOAT32_C( 397.85), SIMDE_FLOAT32_C( 280.50), SIMDE_FLOAT32_C( -482.10), SIMDE_FLOAT32_C( -764.38), SIMDE_FLOAT32_C( 375.26), SIMDE_FLOAT32_C( -613.57), SIMDE_FLOAT32_C( 56.03), SIMDE_FLOAT32_C( 417.16), SIMDE_FLOAT32_C( -424.36), SIMDE_FLOAT32_C( 64.48), SIMDE_FLOAT32_C( 0.84), SIMDE_FLOAT32_C( 101.24), SIMDE_FLOAT32_C( -965.83), SIMDE_FLOAT32_C( 916.49), SIMDE_FLOAT32_C( 799.09), SIMDE_FLOAT32_C( 628.08) }, { SIMDE_FLOAT32_C( 397.85), SIMDE_FLOAT32_C( 280.50), SIMDE_FLOAT32_C( -482.10), SIMDE_FLOAT32_C( -764.38), SIMDE_FLOAT32_C( 375.26), SIMDE_FLOAT32_C( -613.57), SIMDE_FLOAT32_C( 56.03), SIMDE_FLOAT32_C( 417.16), SIMDE_FLOAT32_C( -424.36), SIMDE_FLOAT32_C( 64.48), SIMDE_FLOAT32_C( 0.84), SIMDE_FLOAT32_C( 101.24), SIMDE_FLOAT32_C( -965.83), SIMDE_FLOAT32_C( 916.49), SIMDE_FLOAT32_C( 799.09), SIMDE_FLOAT32_C( 628.08) } }, { { SIMDE_FLOAT32_C( -588.70), SIMDE_FLOAT32_C( 688.61), SIMDE_FLOAT32_C( 202.01), SIMDE_FLOAT32_C( -610.64), SIMDE_FLOAT32_C( 838.07), SIMDE_FLOAT32_C( -733.40), SIMDE_FLOAT32_C( -127.00), SIMDE_FLOAT32_C( 993.35), SIMDE_FLOAT32_C( -249.66), SIMDE_FLOAT32_C( -45.23), SIMDE_FLOAT32_C( 849.71), SIMDE_FLOAT32_C( -85.52), SIMDE_FLOAT32_C( 193.59), SIMDE_FLOAT32_C( -257.46), SIMDE_FLOAT32_C( 827.23), SIMDE_FLOAT32_C( -408.56) }, { SIMDE_FLOAT32_C( -588.70), SIMDE_FLOAT32_C( 688.61), SIMDE_FLOAT32_C( 202.01), SIMDE_FLOAT32_C( -610.64), SIMDE_FLOAT32_C( 838.07), SIMDE_FLOAT32_C( -733.40), SIMDE_FLOAT32_C( -127.00), SIMDE_FLOAT32_C( 993.35), SIMDE_FLOAT32_C( -249.66), SIMDE_FLOAT32_C( -45.23), SIMDE_FLOAT32_C( 849.71), SIMDE_FLOAT32_C( -85.52), SIMDE_FLOAT32_C( 193.59), SIMDE_FLOAT32_C( -257.46), SIMDE_FLOAT32_C( 827.23), SIMDE_FLOAT32_C( -408.56) } }, { { SIMDE_FLOAT32_C( -976.96), SIMDE_FLOAT32_C( -654.87), SIMDE_FLOAT32_C( -172.94), SIMDE_FLOAT32_C( 398.29), SIMDE_FLOAT32_C( -268.45), SIMDE_FLOAT32_C( 883.09), SIMDE_FLOAT32_C( -184.55), SIMDE_FLOAT32_C( 307.20), SIMDE_FLOAT32_C( -52.43), SIMDE_FLOAT32_C( 816.29), SIMDE_FLOAT32_C( -591.56), SIMDE_FLOAT32_C( -18.26), SIMDE_FLOAT32_C( 732.78), SIMDE_FLOAT32_C( -792.48), SIMDE_FLOAT32_C( -390.18), SIMDE_FLOAT32_C( -855.92) }, { SIMDE_FLOAT32_C( -976.96), SIMDE_FLOAT32_C( -654.87), SIMDE_FLOAT32_C( -172.94), SIMDE_FLOAT32_C( 398.29), SIMDE_FLOAT32_C( -268.45), SIMDE_FLOAT32_C( 883.09), SIMDE_FLOAT32_C( -184.55), SIMDE_FLOAT32_C( 307.20), SIMDE_FLOAT32_C( -52.43), SIMDE_FLOAT32_C( 816.29), SIMDE_FLOAT32_C( -591.56), SIMDE_FLOAT32_C( -18.26), SIMDE_FLOAT32_C( 732.78), SIMDE_FLOAT32_C( -792.48), SIMDE_FLOAT32_C( -390.18), SIMDE_FLOAT32_C( -855.92) } }, { { SIMDE_FLOAT32_C( 896.13), SIMDE_FLOAT32_C( 811.83), SIMDE_FLOAT32_C( -466.56), SIMDE_FLOAT32_C( 734.20), SIMDE_FLOAT32_C( -921.57), SIMDE_FLOAT32_C( 406.44), SIMDE_FLOAT32_C( 727.55), SIMDE_FLOAT32_C( -171.23), SIMDE_FLOAT32_C( -638.79), SIMDE_FLOAT32_C( 577.26), SIMDE_FLOAT32_C( 743.25), SIMDE_FLOAT32_C( 554.80), SIMDE_FLOAT32_C( -680.21), SIMDE_FLOAT32_C( 570.48), SIMDE_FLOAT32_C( -853.75), SIMDE_FLOAT32_C( -657.17) }, { SIMDE_FLOAT32_C( 896.13), SIMDE_FLOAT32_C( 811.83), SIMDE_FLOAT32_C( -466.56), SIMDE_FLOAT32_C( 734.20), SIMDE_FLOAT32_C( -921.57), SIMDE_FLOAT32_C( 406.44), SIMDE_FLOAT32_C( 727.55), SIMDE_FLOAT32_C( -171.23), SIMDE_FLOAT32_C( -638.79), SIMDE_FLOAT32_C( 577.26), SIMDE_FLOAT32_C( 743.25), SIMDE_FLOAT32_C( 554.80), SIMDE_FLOAT32_C( -680.21), SIMDE_FLOAT32_C( 570.48), SIMDE_FLOAT32_C( -853.75), SIMDE_FLOAT32_C( -657.17) } }, { { SIMDE_FLOAT32_C( 915.61), SIMDE_FLOAT32_C( -26.70), SIMDE_FLOAT32_C( 741.12), SIMDE_FLOAT32_C( -352.84), SIMDE_FLOAT32_C( -143.61), SIMDE_FLOAT32_C( -443.43), SIMDE_FLOAT32_C( 954.36), SIMDE_FLOAT32_C( 803.96), SIMDE_FLOAT32_C( -627.14), SIMDE_FLOAT32_C( -637.21), SIMDE_FLOAT32_C( -214.30), SIMDE_FLOAT32_C( -894.36), SIMDE_FLOAT32_C( -429.68), SIMDE_FLOAT32_C( 395.52), SIMDE_FLOAT32_C( -750.28), SIMDE_FLOAT32_C( -533.55) }, { SIMDE_FLOAT32_C( 915.61), SIMDE_FLOAT32_C( -26.70), SIMDE_FLOAT32_C( 741.12), SIMDE_FLOAT32_C( -352.84), SIMDE_FLOAT32_C( -143.61), SIMDE_FLOAT32_C( -443.43), SIMDE_FLOAT32_C( 954.36), SIMDE_FLOAT32_C( 803.96), SIMDE_FLOAT32_C( -627.14), SIMDE_FLOAT32_C( -637.21), SIMDE_FLOAT32_C( -214.30), SIMDE_FLOAT32_C( -894.36), SIMDE_FLOAT32_C( -429.68), SIMDE_FLOAT32_C( 395.52), SIMDE_FLOAT32_C( -750.28), SIMDE_FLOAT32_C( -533.55) } }, { { SIMDE_FLOAT32_C( 207.35), SIMDE_FLOAT32_C( -216.84), SIMDE_FLOAT32_C( -799.36), SIMDE_FLOAT32_C( 285.78), SIMDE_FLOAT32_C( -810.40), SIMDE_FLOAT32_C( 928.19), SIMDE_FLOAT32_C( -885.45), SIMDE_FLOAT32_C( -449.19), SIMDE_FLOAT32_C( 505.45), SIMDE_FLOAT32_C( 857.81), SIMDE_FLOAT32_C( -894.39), SIMDE_FLOAT32_C( 825.24), SIMDE_FLOAT32_C( 428.29), SIMDE_FLOAT32_C( -748.14), SIMDE_FLOAT32_C( -831.93), SIMDE_FLOAT32_C( 343.89) }, { SIMDE_FLOAT32_C( 207.35), SIMDE_FLOAT32_C( -216.84), SIMDE_FLOAT32_C( -799.36), SIMDE_FLOAT32_C( 285.78), SIMDE_FLOAT32_C( -810.40), SIMDE_FLOAT32_C( 928.19), SIMDE_FLOAT32_C( -885.45), SIMDE_FLOAT32_C( -449.19), SIMDE_FLOAT32_C( 505.45), SIMDE_FLOAT32_C( 857.81), SIMDE_FLOAT32_C( -894.39), SIMDE_FLOAT32_C( 825.24), SIMDE_FLOAT32_C( 428.29), SIMDE_FLOAT32_C( -748.14), SIMDE_FLOAT32_C( -831.93), SIMDE_FLOAT32_C( 343.89) } }, { { SIMDE_FLOAT32_C( 225.16), SIMDE_FLOAT32_C( 909.19), SIMDE_FLOAT32_C( 991.05), SIMDE_FLOAT32_C( -918.45), SIMDE_FLOAT32_C( -534.23), SIMDE_FLOAT32_C( 945.41), SIMDE_FLOAT32_C( 885.51), SIMDE_FLOAT32_C( -161.37), SIMDE_FLOAT32_C( -691.80), SIMDE_FLOAT32_C( -328.80), SIMDE_FLOAT32_C( -55.73), SIMDE_FLOAT32_C( -121.48), SIMDE_FLOAT32_C( -933.28), SIMDE_FLOAT32_C( 193.99), SIMDE_FLOAT32_C( 344.96), SIMDE_FLOAT32_C( 274.08) }, { SIMDE_FLOAT32_C( 225.16), SIMDE_FLOAT32_C( 909.19), SIMDE_FLOAT32_C( 991.05), SIMDE_FLOAT32_C( -918.45), SIMDE_FLOAT32_C( -534.23), SIMDE_FLOAT32_C( 945.41), SIMDE_FLOAT32_C( 885.51), SIMDE_FLOAT32_C( -161.37), SIMDE_FLOAT32_C( -691.80), SIMDE_FLOAT32_C( -328.80), SIMDE_FLOAT32_C( -55.73), SIMDE_FLOAT32_C( -121.48), SIMDE_FLOAT32_C( -933.28), SIMDE_FLOAT32_C( 193.99), SIMDE_FLOAT32_C( 344.96), SIMDE_FLOAT32_C( 274.08) } }, { { SIMDE_FLOAT32_C( 977.14), SIMDE_FLOAT32_C( 545.61), SIMDE_FLOAT32_C( -440.14), SIMDE_FLOAT32_C( -833.26), SIMDE_FLOAT32_C( 473.80), SIMDE_FLOAT32_C( -325.59), SIMDE_FLOAT32_C( -282.45), SIMDE_FLOAT32_C( -20.75), SIMDE_FLOAT32_C( -467.78), SIMDE_FLOAT32_C( -176.84), SIMDE_FLOAT32_C( -195.51), SIMDE_FLOAT32_C( 960.51), SIMDE_FLOAT32_C( 75.02), SIMDE_FLOAT32_C( -27.44), SIMDE_FLOAT32_C( 304.40), SIMDE_FLOAT32_C( -699.82) }, { SIMDE_FLOAT32_C( 977.14), SIMDE_FLOAT32_C( 545.61), SIMDE_FLOAT32_C( -440.14), SIMDE_FLOAT32_C( -833.26), SIMDE_FLOAT32_C( 473.80), SIMDE_FLOAT32_C( -325.59), SIMDE_FLOAT32_C( -282.45), SIMDE_FLOAT32_C( -20.75), SIMDE_FLOAT32_C( -467.78), SIMDE_FLOAT32_C( -176.84), SIMDE_FLOAT32_C( -195.51), SIMDE_FLOAT32_C( 960.51), SIMDE_FLOAT32_C( 75.02), SIMDE_FLOAT32_C( -27.44), SIMDE_FLOAT32_C( 304.40), SIMDE_FLOAT32_C( -699.82) } } }; for (size_t i = 0 ; i < (sizeof(test_vec) / sizeof(test_vec[0])) ; i++) { simde__m512 a = simde_mm512_loadu_ps(test_vec[i].a); simde_float32 r[sizeof(simde__m512) / sizeof(simde_float32)]; simde_mm512_storeu_ps(r, a); simde_assert_equal_vf32(sizeof(r) / sizeof(r[0]), r, test_vec[i].r, 1); } return 0; #else fputc('\n', stdout); for (int i = 0 ; i < 8 ; i++) { simde__m512 a = simde_test_x86_random_f32x16(SIMDE_FLOAT32_C(-1000.0), SIMDE_FLOAT32_C(1000.0)); simde_float32 r[sizeof(simde__m512) / sizeof(simde_float32)]; simde_mm512_storeu_ps(r, a); simde_test_x86_write_f32x16(2, a, SIMDE_TEST_VEC_POS_FIRST); simde_test_codegen_write_vf32(2, sizeof(r) / sizeof(r[0]), r, SIMDE_TEST_VEC_POS_LAST); } return 1; #endif } SIMDE_TEST_FUNC_LIST_BEGIN SIMDE_TEST_FUNC_LIST_ENTRY(mm512_storeu_ps) SIMDE_TEST_FUNC_LIST_END #include