| @@ -20,75 +20,154 @@ | |||||
| using namespace std; | using namespace std; | ||||
| using namespace lol; | using namespace lol; | ||||
| static size_t const MATRIX_TABLE_SIZE = 64 * 1024; | |||||
| static size_t const MATRIX_RUNS = 100; | |||||
| static size_t const HALF_TABLE_SIZE = 1024 * 1024; | static size_t const HALF_TABLE_SIZE = 1024 * 1024; | ||||
| static size_t const HALF_RUNS = 100; | |||||
| static size_t const HALF_RUNS = 50; | |||||
| static void bench_matrix(int mode); | |||||
| static void bench_half(int mode); | static void bench_half(int mode); | ||||
| int main(int argc, char **argv) | int main(int argc, char **argv) | ||||
| { | { | ||||
| Log::Info("-----------------------------------\n"); | |||||
| Log::Info("Half precision floats (random bits)\n"); | |||||
| Log::Info("-----------------------------------\n"); | |||||
| Log::Info("----------------------------\n"); | |||||
| Log::Info(" Float matrices [-2.0, 2.0]\n"); | |||||
| Log::Info("----------------------------\n"); | |||||
| bench_matrix(1); | |||||
| Log::Info("-------------------------------------\n"); | |||||
| Log::Info(" Half precision floats (random bits)\n"); | |||||
| Log::Info("-------------------------------------\n"); | |||||
| bench_half(1); | bench_half(1); | ||||
| Log::Info("---------------------------------\n"); | |||||
| Log::Info("Half precision floats [-2.0, 2.0]\n"); | |||||
| Log::Info("---------------------------------\n"); | |||||
| Log::Info("-----------------------------------\n"); | |||||
| Log::Info(" Half precision floats [-2.0, 2.0]\n"); | |||||
| Log::Info("-----------------------------------\n"); | |||||
| bench_half(2); | bench_half(2); | ||||
| return EXIT_SUCCESS; | return EXIT_SUCCESS; | ||||
| } | } | ||||
| static void bench_half(int mode) | |||||
| static void bench_matrix(int mode) | |||||
| { | { | ||||
| float result[8] = { 0.0f }; | |||||
| float result[5] = { 0.0f }; | |||||
| Timer timer; | Timer timer; | ||||
| /* Set up tables */ | /* Set up tables */ | ||||
| float *pf = new float[HALF_TABLE_SIZE]; | |||||
| half *ph = new half[HALF_TABLE_SIZE]; | |||||
| mat4 *pm = new mat4[MATRIX_TABLE_SIZE + 1]; | |||||
| float *pf = new float[MATRIX_TABLE_SIZE]; | |||||
| switch (mode) | |||||
| for (size_t run = 0; run < MATRIX_RUNS; run++) | |||||
| { | { | ||||
| case 1: | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | |||||
| ph[i] = half::makebits(rand()); | |||||
| break; | |||||
| case 2: | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | |||||
| ph[i] = RandF(-2.0f, 2.0f); | |||||
| break; | |||||
| switch (mode) | |||||
| { | |||||
| case 1: | |||||
| for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) | |||||
| for (int j = 0; j < 4; j++) | |||||
| for (int k = 0; k < 4; k++) | |||||
| pm[i][j][k] = RandF(-2.0f, 2.0f); | |||||
| break; | |||||
| } | |||||
| /* Copy matrices */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) | |||||
| pm[i] = pm[i + 1]; | |||||
| result[0] += timer.GetMs(); | |||||
| /* Determinant */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) | |||||
| pf[i] = pm[i].det(); | |||||
| result[1] += timer.GetMs(); | |||||
| /* Multiply matrices */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) | |||||
| pm[i] *= pm[i + 1]; | |||||
| result[2] += timer.GetMs(); | |||||
| /* Add matrices */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) | |||||
| pm[i] += pm[i + 1]; | |||||
| result[3] += timer.GetMs(); | |||||
| /* Invert matrix */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) | |||||
| pm[i] = pm[i].invert(); | |||||
| result[4] += timer.GetMs(); | |||||
| } | } | ||||
| delete[] pm; | |||||
| delete[] pf; | |||||
| for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++) | |||||
| result[i] *= 1000000.0f / (MATRIX_TABLE_SIZE * MATRIX_RUNS); | |||||
| Log::Info(" ns/elem\n"); | |||||
| Log::Info("mat4 = mat4 %7.3f\n", result[0]); | |||||
| Log::Info("float = mat4.det() %7.3f\n", result[1]); | |||||
| Log::Info("mat4 *= mat4 %7.3f\n", result[2]); | |||||
| Log::Info("mat4 += mat4 %7.3f\n", result[3]); | |||||
| Log::Info("mat4 = mat4.invert() %7.3f\n", result[4]); | |||||
| } | |||||
| static void bench_half(int mode) | |||||
| { | |||||
| float result[10] = { 0.0f }; | |||||
| Timer timer; | |||||
| /* Set up tables */ | |||||
| float *pf = new float[HALF_TABLE_SIZE + 1]; | |||||
| half *ph = new half[HALF_TABLE_SIZE + 1]; | |||||
| for (size_t run = 0; run < HALF_RUNS; run++) | for (size_t run = 0; run < HALF_RUNS; run++) | ||||
| { | { | ||||
| switch (mode) | |||||
| { | |||||
| case 1: | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE + 1; i++) | |||||
| ph[i] = half::makebits(rand()); | |||||
| break; | |||||
| case 2: | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE + 1; i++) | |||||
| ph[i] = RandF(-2.0f, 2.0f); | |||||
| break; | |||||
| } | |||||
| #if defined __EXCEPTIONS | |||||
| #error lol | |||||
| #endif | |||||
| /* Copy float */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | |||||
| pf[i] = pf[i + 1]; | |||||
| result[0] += timer.GetMs(); | |||||
| /* Convert half to float (array) */ | /* Convert half to float (array) */ | ||||
| timer.GetMs(); | timer.GetMs(); | ||||
| half::convert(pf, ph, HALF_TABLE_SIZE); | half::convert(pf, ph, HALF_TABLE_SIZE); | ||||
| result[0] += timer.GetMs(); | |||||
| result[1] += timer.GetMs(); | |||||
| /* Convert half to float (fast) */ | /* Convert half to float (fast) */ | ||||
| timer.GetMs(); | timer.GetMs(); | ||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | ||||
| pf[i] = (float)ph[i]; | pf[i] = (float)ph[i]; | ||||
| result[1] += timer.GetMs(); | |||||
| /* Convert float to half (array) */ | |||||
| timer.GetMs(); | |||||
| half::convert(ph, pf, HALF_TABLE_SIZE); | |||||
| result[2] += timer.GetMs(); | result[2] += timer.GetMs(); | ||||
| /* Convert float to half (fast) */ | |||||
| /* Add a half to every float */ | |||||
| timer.GetMs(); | timer.GetMs(); | ||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | ||||
| ph[i] = (half)pf[i]; | |||||
| pf[i] += ph[i]; | |||||
| result[3] += timer.GetMs(); | result[3] += timer.GetMs(); | ||||
| /* Convert float to half (accurate) */ | |||||
| /* Copy half */ | |||||
| timer.GetMs(); | timer.GetMs(); | ||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | ||||
| ph[i] = half::makeaccurate(pf[i]); | |||||
| ph[i] = ph[i + 1]; | |||||
| result[4] += timer.GetMs(); | result[4] += timer.GetMs(); | ||||
| /* Change sign of every half */ | /* Change sign of every half */ | ||||
| @@ -97,33 +176,46 @@ static void bench_half(int mode) | |||||
| ph[i] = -ph[i]; | ph[i] = -ph[i]; | ||||
| result[5] += timer.GetMs(); | result[5] += timer.GetMs(); | ||||
| /* Add a half to every float */ | |||||
| /* Convert float to half (array) */ | |||||
| timer.GetMs(); | timer.GetMs(); | ||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | |||||
| pf[i] += ph[i]; | |||||
| half::convert(ph, pf, HALF_TABLE_SIZE); | |||||
| result[6] += timer.GetMs(); | result[6] += timer.GetMs(); | ||||
| /* Convert float to half (fast) */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | |||||
| ph[i] = (half)pf[i]; | |||||
| result[7] += timer.GetMs(); | |||||
| /* Convert float to half (accurate) */ | |||||
| timer.GetMs(); | |||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | |||||
| ph[i] = half::makeaccurate(pf[i]); | |||||
| result[8] += timer.GetMs(); | |||||
| /* Add a float to every half */ | /* Add a float to every half */ | ||||
| timer.GetMs(); | timer.GetMs(); | ||||
| for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | for (size_t i = 0; i < HALF_TABLE_SIZE; i++) | ||||
| ph[i] += pf[i]; | ph[i] += pf[i]; | ||||
| result[7] += timer.GetMs(); | |||||
| result[9] += timer.GetMs(); | |||||
| } | } | ||||
| delete[]pf; | |||||
| delete[]ph; | |||||
| delete[] pf; | |||||
| delete[] ph; | |||||
| for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++) | for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++) | ||||
| result[i] *= 1000000.0f / (HALF_TABLE_SIZE * HALF_RUNS); | result[i] *= 1000000.0f / (HALF_TABLE_SIZE * HALF_RUNS); | ||||
| Log::Info(" ns/elem\n"); | Log::Info(" ns/elem\n"); | ||||
| Log::Info("float[] = half[] %7.3f\n", result[0]); | |||||
| Log::Info("float = half %7.3f\n", result[1]); | |||||
| Log::Info("half[] = float[] %7.3f\n", result[2]); | |||||
| Log::Info("half = float (fast) %7.3f\n", result[3]); | |||||
| Log::Info("half = float (accurate) %7.3f\n", result[4]); | |||||
| Log::Info("float = float %7.3f\n", result[0]); | |||||
| Log::Info("float = half (array) %7.3f\n", result[1]); | |||||
| Log::Info("float = half (fast) %7.3f\n", result[2]); | |||||
| Log::Info("float += half %7.3f\n", result[3]); | |||||
| Log::Info("half = half %7.3f\n", result[4]); | |||||
| Log::Info("half = -half %7.3f\n", result[5]); | Log::Info("half = -half %7.3f\n", result[5]); | ||||
| Log::Info("float += half %7.3f\n", result[6]); | |||||
| Log::Info("half += float %7.3f\n", result[7]); | |||||
| Log::Info("half = float (array) %7.3f\n", result[6]); | |||||
| Log::Info("half = float (fast) %7.3f\n", result[7]); | |||||
| Log::Info("half = float (accurate) %7.3f\n", result[8]); | |||||
| Log::Info("half += float %7.3f\n", result[9]); | |||||
| } | } | ||||