#include "head.c" #include "QF/mathlib.h" #define sq(x) ((float)(x)*(float)(x)) static pr_vec4_t float_binop_init[] = { { 5, -5, 5, -5}, { 3, 3, -3, -3}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, }; static pr_vec4_t float_binop_expect[] = { { 5, -5, 5, -5}, { 3, 3, -3, -3}, { 15, -15, -15, 15}, { 1.666666627, -1.666666627, -1.666666627, 1.666666627}, { 2, -2, 2, -2}, { 2, 1, -1, -2}, { 8, -2, 2, -8}, { 2, -8, 8, -2}, }; static dstatement_t float_binop_1_statements[] = { { OP(0, 0, 0, OP_LEA_A), 4, 0, 32 }, // init index //loop: { OP(0, 0, 0, OP_LEA_C), 32, -1, 32 }, // dec index { OP(0, 0, 0, OP_IFAE), 2, 0, 32 }, { OP(0, 0, 0, OP_BREAK), 0, 0, 0 }, { OP(0, 0, 0, OP_WITH), 4, 32, 1 }, { OP(1, 1, 1, OP_MUL_F_1), 0, 4, 8 }, { OP(1, 1, 1, OP_DIV_F_1), 0, 4, 12 }, { OP(1, 1, 1, OP_REM_F_1), 0, 4, 16 }, { OP(1, 1, 1, OP_MOD_F_1), 0, 4, 20 }, { OP(1, 1, 1, OP_ADD_F_1), 0, 4, 24 }, { OP(1, 1, 1, OP_SUB_F_1), 0, 4, 28 }, { OP(1, 1, 1, OP_JUMP_A), -10, 0, 0 }, }; static dstatement_t float_binop_2_statements[] = { { OP(0, 0, 0, OP_LEA_A), 4, 0, 32 }, // index //loop: { OP(0, 0, 0, OP_LEA_C), 32, -2, 32 }, // dec index { OP(0, 0, 0, OP_IFAE), 2, 0, 32 }, { OP(0, 0, 0, OP_BREAK), 0, 0, 0 }, { OP(0, 0, 0, OP_WITH), 4, 32, 1 }, { OP(1, 1, 1, OP_MUL_F_2), 0, 4, 8 }, { OP(1, 1, 1, OP_DIV_F_2), 0, 4, 12 }, { OP(1, 1, 1, OP_REM_F_2), 0, 4, 16 }, { OP(1, 1, 1, OP_MOD_F_2), 0, 4, 20 }, { OP(1, 1, 1, OP_ADD_F_2), 0, 4, 24 }, { OP(1, 1, 1, OP_SUB_F_2), 0, 4, 28 }, { OP(1, 1, 1, OP_JUMP_A), -10, 0, 0 }, }; static dstatement_t float_binop_3a_statements[] = { { OP(1, 1, 1, OP_MUL_F_3), 0, 4, 8 }, { OP(1, 1, 1, OP_MUL_F_1), 3, 7, 11 }, { OP(1, 1, 1, OP_DIV_F_3), 0, 4, 12 }, { OP(1, 1, 1, OP_DIV_F_1), 3, 7, 15 }, { OP(1, 1, 1, OP_REM_F_3), 0, 4, 16 }, { OP(1, 1, 1, OP_REM_F_1), 3, 7, 19 }, { OP(1, 1, 1, OP_MOD_F_3), 0, 4, 20 }, { OP(1, 1, 1, OP_MOD_F_1), 3, 7, 23 }, { OP(1, 1, 1, OP_ADD_F_3), 0, 4, 24 }, { OP(1, 1, 1, OP_ADD_F_1), 3, 7, 27 }, { OP(1, 1, 1, OP_SUB_F_3), 0, 4, 28 }, { OP(1, 1, 1, OP_SUB_F_1), 3, 7, 31 }, }; static dstatement_t float_binop_3b_statements[] = { { OP(1, 1, 1, OP_MUL_F_1), 0, 4, 8 }, { OP(1, 1, 1, OP_MUL_F_3), 1, 5, 9 }, { OP(1, 1, 1, OP_DIV_F_1), 0, 4, 12 }, { OP(1, 1, 1, OP_DIV_F_3), 1, 5, 13 }, { OP(1, 1, 1, OP_REM_F_1), 0, 4, 16 }, { OP(1, 1, 1, OP_REM_F_3), 1, 5, 17 }, { OP(1, 1, 1, OP_MOD_F_1), 0, 4, 20 }, { OP(1, 1, 1, OP_MOD_F_3), 1, 5, 21 }, { OP(1, 1, 1, OP_ADD_F_1), 0, 4, 24 }, { OP(1, 1, 1, OP_ADD_F_3), 1, 5, 25 }, { OP(1, 1, 1, OP_SUB_F_1), 0, 4, 28 }, { OP(1, 1, 1, OP_SUB_F_3), 1, 5, 29 }, }; static dstatement_t float_binop_4_statements[] = { { OP(1, 1, 1, OP_MUL_F_4), 0, 4, 8 }, { OP(1, 1, 1, OP_DIV_F_4), 0, 4, 12 }, { OP(1, 1, 1, OP_REM_F_4), 0, 4, 16 }, { OP(1, 1, 1, OP_MOD_F_4), 0, 4, 20 }, { OP(1, 1, 1, OP_ADD_F_4), 0, 4, 24 }, { OP(1, 1, 1, OP_SUB_F_4), 0, 4, 28 }, }; static pr_vec4_t float_cossin_init[] = { { 1, 2, 3, 4 }, // 0: output { M_PI/6, 0, 0, 0 }, // 4: x { 1, 2, 0, 0 }, // 8: f { 1, 1, 0, 25 }, // 12: f inc and f0 max { 0, 0, 0, 0 }, // 16: x2 -> [xx, xx] // { } // 20: xn }; static pr_vec4_t float_cossin_expect[] = { { 0.866025388, 0.5, 0, 0 }, // 0: output { M_PI/6, 0, 0, 0 }, // 4: x { 25, 26, 0, 0 }, // 8: f { 1, 1, 0, 25 }, // 12: f inc and f0 max { -sq(M_PI/6), -sq(M_PI/6), 0, 0 }, // 16: x2 -> [xx, xx] }; static dstatement_t float_cossin_statements[] = { { OP(0, 0, 0, OP_STORE_A_1), 21, 0, 4 }, // init xn -> [?, x] { OP(0, 0, 0, OP_STORE_A_1), 20, 0, 8 }, // init xn -> [1, x] { OP(0, 0, 0, OP_SWIZZLE_F_4), 4, 0xc000, 16 },// init x2 -> [x, x, 0, 0] { OP(0, 0, 0, OP_MUL_F_2), 16, 16, 16 }, // x2 -> [x*x, x*x, 0, 0] { OP(0, 0, 0, OP_SWIZZLE_F_4), 16, 0xc3e4, 16 },// init x2 -> -x2 { OP(0, 0, 0, OP_SUB_F_4), 0, 0, 0 }, // init acc (output) to 0 // loop: { OP(0, 0, 0, OP_ADD_F_2), 0, 20, 0 }, // acc += xn { OP(0, 0, 0, OP_MUL_F_2), 20, 16, 20 }, // xn *= x2 { OP(0, 0, 0, OP_DIV_F_2), 20, 8, 20 }, // xn /= f { OP(0, 0, 0, OP_ADD_F_2), 8, 12, 8 }, // f += inc { OP(0, 0, 0, OP_DIV_F_2), 20, 8, 20 }, // xn /= f { OP(0, 0, 0, OP_ADD_F_2), 8, 12, 8 }, // f += inc { OP(0, 0, 0, OP_LT_F_1), 8, 15, 23 }, // f0 < fmax { OP(0, 0, 0, OP_IFNZ), -7, 0, 23 }, // f0 < fmax }; static pr_vec4_t float_cmpop_init[] = { { 5, -5, 5, -5}, { 5, 5, -5, -5}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, { 0, 0, 0, 0}, }; // 5.0 as 32-bit int #define F 0x40a00000 #define mF 0xc0a00000 static pr_ivec4_t float_cmpop_expect[] = { { F, mF, F, mF}, { F, F, mF, mF}, { -1, 0, 0, -1}, { 0, -1, 0, 0}, { 0, 0, -1, 0}, { 0, -1, -1, 0}, { -1, 0, -1, -1}, { -1, -1, 0, -1}, }; static dstatement_t float_cmpop_1_statements[] = { { OP(0, 0, 0, OP_LEA_A), 4, 0, 32 }, // init index //loop: { OP(0, 0, 0, OP_LEA_C), 32, -1, 32 }, // dec index { OP(0, 0, 0, OP_IFAE), 2, 0, 32 }, { OP(0, 0, 0, OP_BREAK), 0, 0, 0 }, { OP(0, 0, 0, OP_WITH), 4, 32, 1 }, { OP(1, 1, 1, OP_EQ_F_1), 0, 4, 8 }, { OP(1, 1, 1, OP_LT_F_1), 0, 4, 12 }, { OP(1, 1, 1, OP_GT_F_1), 0, 4, 16 }, { OP(1, 1, 1, OP_NE_F_1), 0, 4, 20 }, { OP(1, 1, 1, OP_GE_F_1), 0, 4, 24 }, { OP(1, 1, 1, OP_LE_F_1), 0, 4, 28 }, { OP(1, 1, 1, OP_JUMP_A), -10, 0, 0 }, }; static dstatement_t float_cmpop_2_statements[] = { { OP(0, 0, 0, OP_LEA_A), 4, 0, 32 }, // index //loop: { OP(0, 0, 0, OP_LEA_C), 32, -2, 32 }, // dec index { OP(0, 0, 0, OP_IFAE), 2, 0, 32 }, { OP(0, 0, 0, OP_BREAK), 0, 0, 0 }, { OP(0, 0, 0, OP_WITH), 4, 32, 1 }, { OP(1, 1, 1, OP_EQ_F_2), 0, 4, 8 }, { OP(1, 1, 1, OP_LT_F_2), 0, 4, 12 }, { OP(1, 1, 1, OP_GT_F_2), 0, 4, 16 }, { OP(1, 1, 1, OP_NE_F_2), 0, 4, 20 }, { OP(1, 1, 1, OP_GE_F_2), 0, 4, 24 }, { OP(1, 1, 1, OP_LE_F_2), 0, 4, 28 }, { OP(1, 1, 1, OP_JUMP_A), -10, 0, 0 }, }; static dstatement_t float_cmpop_3a_statements[] = { { OP(1, 1, 1, OP_EQ_F_3), 0, 4, 8 }, { OP(1, 1, 1, OP_EQ_F_1), 3, 7, 11 }, { OP(1, 1, 1, OP_LT_F_3), 0, 4, 12 }, { OP(1, 1, 1, OP_LT_F_1), 3, 7, 15 }, { OP(1, 1, 1, OP_GT_F_3), 0, 4, 16 }, { OP(1, 1, 1, OP_GT_F_1), 3, 7, 19 }, { OP(1, 1, 1, OP_NE_F_3), 0, 4, 20 }, { OP(1, 1, 1, OP_NE_F_1), 3, 7, 23 }, { OP(1, 1, 1, OP_GE_F_3), 0, 4, 24 }, { OP(1, 1, 1, OP_GE_F_1), 3, 7, 27 }, { OP(1, 1, 1, OP_LE_F_3), 0, 4, 28 }, { OP(1, 1, 1, OP_LE_F_1), 3, 7, 31 }, }; static dstatement_t float_cmpop_3b_statements[] = { { OP(1, 1, 1, OP_EQ_F_1), 0, 4, 8 }, { OP(1, 1, 1, OP_EQ_F_3), 1, 5, 9 }, { OP(1, 1, 1, OP_LT_F_1), 0, 4, 12 }, { OP(1, 1, 1, OP_LT_F_3), 1, 5, 13 }, { OP(1, 1, 1, OP_GT_F_1), 0, 4, 16 }, { OP(1, 1, 1, OP_GT_F_3), 1, 5, 17 }, { OP(1, 1, 1, OP_NE_F_1), 0, 4, 20 }, { OP(1, 1, 1, OP_NE_F_3), 1, 5, 21 }, { OP(1, 1, 1, OP_GE_F_1), 0, 4, 24 }, { OP(1, 1, 1, OP_GE_F_3), 1, 5, 25 }, { OP(1, 1, 1, OP_LE_F_1), 0, 4, 28 }, { OP(1, 1, 1, OP_LE_F_3), 1, 5, 29 }, }; static dstatement_t float_cmpop_4_statements[] = { { OP(1, 1, 1, OP_EQ_F_4), 0, 4, 8 }, { OP(1, 1, 1, OP_LT_F_4), 0, 4, 12 }, { OP(1, 1, 1, OP_GT_F_4), 0, 4, 16 }, { OP(1, 1, 1, OP_NE_F_4), 0, 4, 20 }, { OP(1, 1, 1, OP_GE_F_4), 0, 4, 24 }, { OP(1, 1, 1, OP_LE_F_4), 0, 4, 28 }, }; test_t tests[] = { { .desc = "float binop 1", .extra_globals = 4 * 1, .num_globals = num_globals(float_binop_init,float_binop_expect), .num_statements = num_statements (float_binop_1_statements), .statements = float_binop_1_statements, .init_globals = (pr_int_t *) float_binop_init, .expect_globals = (pr_int_t *) float_binop_expect, }, { .desc = "float binop 2", .extra_globals = 4 * 1, .num_globals = num_globals(float_binop_init,float_binop_expect), .num_statements = num_statements (float_binop_2_statements), .statements = float_binop_2_statements, .init_globals = (pr_int_t *) float_binop_init, .expect_globals = (pr_int_t *) float_binop_expect, }, { .desc = "float binop 3a", .extra_globals = 4 * 1, .num_globals = num_globals(float_binop_init,float_binop_expect), .num_statements = num_statements (float_binop_3a_statements), .statements = float_binop_3a_statements, .init_globals = (pr_int_t *) float_binop_init, .expect_globals = (pr_int_t *) float_binop_expect, }, { .desc = "float binop 3b", .extra_globals = 4 * 1, .num_globals = num_globals(float_binop_init,float_binop_expect), .num_statements = num_statements (float_binop_3b_statements), .statements = float_binop_3b_statements, .init_globals = (pr_int_t *) float_binop_init, .expect_globals = (pr_int_t *) float_binop_expect, }, { .desc = "float binop 4", .extra_globals = 4 * 1, .num_globals = num_globals(float_binop_init,float_binop_expect), .num_statements = num_statements (float_binop_4_statements), .statements = float_binop_4_statements, .init_globals = (pr_int_t *) float_binop_init, .expect_globals = (pr_int_t *) float_binop_expect, }, { .desc = "float cos sin", .extra_globals = 4 * 1, .num_globals = num_globals (float_cossin_init, float_cossin_expect), .num_statements = num_statements (float_cossin_statements), .statements = float_cossin_statements, .init_globals = (pr_int_t *) float_cossin_init, .expect_globals = (pr_int_t *) float_cossin_expect, }, { .desc = "float cmpop 1", .extra_globals = 4 * 1, .num_globals = num_globals(float_cmpop_init,float_cmpop_expect), .num_statements = num_statements (float_cmpop_1_statements), .statements = float_cmpop_1_statements, .init_globals = (pr_int_t *) float_cmpop_init, .expect_globals = (pr_int_t *) float_cmpop_expect, }, { .desc = "float cmpop 2", .extra_globals = 4 * 1, .num_globals = num_globals(float_cmpop_init,float_cmpop_expect), .num_statements = num_statements (float_cmpop_2_statements), .statements = float_cmpop_2_statements, .init_globals = (pr_int_t *) float_cmpop_init, .expect_globals = (pr_int_t *) float_cmpop_expect, }, { .desc = "float cmpop 3a", .extra_globals = 4 * 1, .num_globals = num_globals(float_cmpop_init,float_cmpop_expect), .num_statements = num_statements (float_cmpop_3a_statements), .statements = float_cmpop_3a_statements, .init_globals = (pr_int_t *) float_cmpop_init, .expect_globals = (pr_int_t *) float_cmpop_expect, }, { .desc = "float cmpop 3b", .extra_globals = 4 * 1, .num_globals = num_globals(float_cmpop_init,float_cmpop_expect), .num_statements = num_statements (float_cmpop_3b_statements), .statements = float_cmpop_3b_statements, .init_globals = (pr_int_t *) float_cmpop_init, .expect_globals = (pr_int_t *) float_cmpop_expect, }, { .desc = "float cmpop 4", .extra_globals = 4 * 1, .num_globals = num_globals(float_cmpop_init,float_cmpop_expect), .num_statements = num_statements (float_cmpop_4_statements), .statements = float_cmpop_4_statements, .init_globals = (pr_int_t *) float_cmpop_init, .expect_globals = (pr_int_t *) float_cmpop_expect, }, }; #include "main.c"