|
|
@@ -20,75 +20,154 @@ |
|
|
|
using namespace std; |
|
|
|
using namespace lol; |
|
|
|
|
|
|
|
static size_t const MATRIX_TABLE_SIZE = 64 * 1024; |
|
|
|
static size_t const MATRIX_RUNS = 100; |
|
|
|
|
|
|
|
static size_t const HALF_TABLE_SIZE = 1024 * 1024; |
|
|
|
static size_t const HALF_RUNS = 100; |
|
|
|
static size_t const HALF_RUNS = 50; |
|
|
|
|
|
|
|
static void bench_matrix(int mode); |
|
|
|
static void bench_half(int mode); |
|
|
|
|
|
|
|
int main(int argc, char **argv) |
|
|
|
{ |
|
|
|
Log::Info("-----------------------------------\n"); |
|
|
|
Log::Info("Half precision floats (random bits)\n"); |
|
|
|
Log::Info("-----------------------------------\n"); |
|
|
|
Log::Info("----------------------------\n"); |
|
|
|
Log::Info(" Float matrices [-2.0, 2.0]\n"); |
|
|
|
Log::Info("----------------------------\n"); |
|
|
|
bench_matrix(1); |
|
|
|
|
|
|
|
Log::Info("-------------------------------------\n"); |
|
|
|
Log::Info(" Half precision floats (random bits)\n"); |
|
|
|
Log::Info("-------------------------------------\n"); |
|
|
|
bench_half(1); |
|
|
|
|
|
|
|
Log::Info("---------------------------------\n"); |
|
|
|
Log::Info("Half precision floats [-2.0, 2.0]\n"); |
|
|
|
Log::Info("---------------------------------\n"); |
|
|
|
Log::Info("-----------------------------------\n"); |
|
|
|
Log::Info(" Half precision floats [-2.0, 2.0]\n"); |
|
|
|
Log::Info("-----------------------------------\n"); |
|
|
|
bench_half(2); |
|
|
|
|
|
|
|
return EXIT_SUCCESS; |
|
|
|
} |
|
|
|
|
|
|
|
static void bench_half(int mode) |
|
|
|
static void bench_matrix(int mode) |
|
|
|
{ |
|
|
|
float result[8] = { 0.0f }; |
|
|
|
float result[5] = { 0.0f }; |
|
|
|
Timer timer; |
|
|
|
|
|
|
|
/* Set up tables */ |
|
|
|
float *pf = new float[HALF_TABLE_SIZE]; |
|
|
|
half *ph = new half[HALF_TABLE_SIZE]; |
|
|
|
mat4 *pm = new mat4[MATRIX_TABLE_SIZE + 1]; |
|
|
|
float *pf = new float[MATRIX_TABLE_SIZE]; |
|
|
|
|
|
|
|
switch (mode) |
|
|
|
for (size_t run = 0; run < MATRIX_RUNS; run++) |
|
|
|
{ |
|
|
|
case 1: |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] = half::makebits(rand()); |
|
|
|
break; |
|
|
|
case 2: |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] = RandF(-2.0f, 2.0f); |
|
|
|
break; |
|
|
|
switch (mode) |
|
|
|
{ |
|
|
|
case 1: |
|
|
|
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) |
|
|
|
for (int j = 0; j < 4; j++) |
|
|
|
for (int k = 0; k < 4; k++) |
|
|
|
pm[i][j][k] = RandF(-2.0f, 2.0f); |
|
|
|
break; |
|
|
|
} |
|
|
|
|
|
|
|
/* Copy matrices */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) |
|
|
|
pm[i] = pm[i + 1]; |
|
|
|
result[0] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Determinant */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) |
|
|
|
pf[i] = pm[i].det(); |
|
|
|
result[1] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Multiply matrices */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) |
|
|
|
pm[i] *= pm[i + 1]; |
|
|
|
result[2] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Add matrices */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) |
|
|
|
pm[i] += pm[i + 1]; |
|
|
|
result[3] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Invert matrix */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++) |
|
|
|
pm[i] = pm[i].invert(); |
|
|
|
result[4] += timer.GetMs(); |
|
|
|
} |
|
|
|
|
|
|
|
delete[] pm; |
|
|
|
delete[] pf; |
|
|
|
|
|
|
|
for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++) |
|
|
|
result[i] *= 1000000.0f / (MATRIX_TABLE_SIZE * MATRIX_RUNS); |
|
|
|
|
|
|
|
Log::Info(" ns/elem\n"); |
|
|
|
Log::Info("mat4 = mat4 %7.3f\n", result[0]); |
|
|
|
Log::Info("float = mat4.det() %7.3f\n", result[1]); |
|
|
|
Log::Info("mat4 *= mat4 %7.3f\n", result[2]); |
|
|
|
Log::Info("mat4 += mat4 %7.3f\n", result[3]); |
|
|
|
Log::Info("mat4 = mat4.invert() %7.3f\n", result[4]); |
|
|
|
} |
|
|
|
|
|
|
|
static void bench_half(int mode) |
|
|
|
{ |
|
|
|
float result[10] = { 0.0f }; |
|
|
|
Timer timer; |
|
|
|
|
|
|
|
/* Set up tables */ |
|
|
|
float *pf = new float[HALF_TABLE_SIZE + 1]; |
|
|
|
half *ph = new half[HALF_TABLE_SIZE + 1]; |
|
|
|
|
|
|
|
for (size_t run = 0; run < HALF_RUNS; run++) |
|
|
|
{ |
|
|
|
switch (mode) |
|
|
|
{ |
|
|
|
case 1: |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE + 1; i++) |
|
|
|
ph[i] = half::makebits(rand()); |
|
|
|
break; |
|
|
|
case 2: |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE + 1; i++) |
|
|
|
ph[i] = RandF(-2.0f, 2.0f); |
|
|
|
break; |
|
|
|
} |
|
|
|
#if defined __EXCEPTIONS |
|
|
|
#error lol |
|
|
|
#endif |
|
|
|
|
|
|
|
/* Copy float */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
pf[i] = pf[i + 1]; |
|
|
|
result[0] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert half to float (array) */ |
|
|
|
timer.GetMs(); |
|
|
|
half::convert(pf, ph, HALF_TABLE_SIZE); |
|
|
|
result[0] += timer.GetMs(); |
|
|
|
result[1] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert half to float (fast) */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
pf[i] = (float)ph[i]; |
|
|
|
result[1] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert float to half (array) */ |
|
|
|
timer.GetMs(); |
|
|
|
half::convert(ph, pf, HALF_TABLE_SIZE); |
|
|
|
result[2] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert float to half (fast) */ |
|
|
|
/* Add a half to every float */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] = (half)pf[i]; |
|
|
|
pf[i] += ph[i]; |
|
|
|
result[3] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert float to half (accurate) */ |
|
|
|
/* Copy half */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] = half::makeaccurate(pf[i]); |
|
|
|
ph[i] = ph[i + 1]; |
|
|
|
result[4] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Change sign of every half */ |
|
|
@@ -97,33 +176,46 @@ static void bench_half(int mode) |
|
|
|
ph[i] = -ph[i]; |
|
|
|
result[5] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Add a half to every float */ |
|
|
|
/* Convert float to half (array) */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
pf[i] += ph[i]; |
|
|
|
half::convert(ph, pf, HALF_TABLE_SIZE); |
|
|
|
result[6] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert float to half (fast) */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] = (half)pf[i]; |
|
|
|
result[7] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Convert float to half (accurate) */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] = half::makeaccurate(pf[i]); |
|
|
|
result[8] += timer.GetMs(); |
|
|
|
|
|
|
|
/* Add a float to every half */ |
|
|
|
timer.GetMs(); |
|
|
|
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) |
|
|
|
ph[i] += pf[i]; |
|
|
|
result[7] += timer.GetMs(); |
|
|
|
result[9] += timer.GetMs(); |
|
|
|
} |
|
|
|
|
|
|
|
delete[]pf; |
|
|
|
delete[]ph; |
|
|
|
delete[] pf; |
|
|
|
delete[] ph; |
|
|
|
|
|
|
|
for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++) |
|
|
|
result[i] *= 1000000.0f / (HALF_TABLE_SIZE * HALF_RUNS); |
|
|
|
|
|
|
|
Log::Info(" ns/elem\n"); |
|
|
|
Log::Info("float[] = half[] %7.3f\n", result[0]); |
|
|
|
Log::Info("float = half %7.3f\n", result[1]); |
|
|
|
Log::Info("half[] = float[] %7.3f\n", result[2]); |
|
|
|
Log::Info("half = float (fast) %7.3f\n", result[3]); |
|
|
|
Log::Info("half = float (accurate) %7.3f\n", result[4]); |
|
|
|
Log::Info("float = float %7.3f\n", result[0]); |
|
|
|
Log::Info("float = half (array) %7.3f\n", result[1]); |
|
|
|
Log::Info("float = half (fast) %7.3f\n", result[2]); |
|
|
|
Log::Info("float += half %7.3f\n", result[3]); |
|
|
|
Log::Info("half = half %7.3f\n", result[4]); |
|
|
|
Log::Info("half = -half %7.3f\n", result[5]); |
|
|
|
Log::Info("float += half %7.3f\n", result[6]); |
|
|
|
Log::Info("half += float %7.3f\n", result[7]); |
|
|
|
Log::Info("half = float (array) %7.3f\n", result[6]); |
|
|
|
Log::Info("half = float (fast) %7.3f\n", result[7]); |
|
|
|
Log::Info("half = float (accurate) %7.3f\n", result[8]); |
|
|
|
Log::Info("half += float %7.3f\n", result[9]); |
|
|
|
} |
|
|
|
|