Browse Source

test: add matrix code to the benchmark program.

legacy
Sam Hocevar sam 13 years ago
parent
commit
782283a3d0
1 changed files with 135 additions and 43 deletions
  1. +135
    -43
      test/lol-bench.cpp

+ 135
- 43
test/lol-bench.cpp View File

@@ -20,75 +20,154 @@
using namespace std; using namespace std;
using namespace lol; using namespace lol;


static size_t const MATRIX_TABLE_SIZE = 64 * 1024;
static size_t const MATRIX_RUNS = 100;

static size_t const HALF_TABLE_SIZE = 1024 * 1024; static size_t const HALF_TABLE_SIZE = 1024 * 1024;
static size_t const HALF_RUNS = 100;
static size_t const HALF_RUNS = 50;


static void bench_matrix(int mode);
static void bench_half(int mode); static void bench_half(int mode);


int main(int argc, char **argv) int main(int argc, char **argv)
{ {
Log::Info("-----------------------------------\n");
Log::Info("Half precision floats (random bits)\n");
Log::Info("-----------------------------------\n");
Log::Info("----------------------------\n");
Log::Info(" Float matrices [-2.0, 2.0]\n");
Log::Info("----------------------------\n");
bench_matrix(1);

Log::Info("-------------------------------------\n");
Log::Info(" Half precision floats (random bits)\n");
Log::Info("-------------------------------------\n");
bench_half(1); bench_half(1);


Log::Info("---------------------------------\n");
Log::Info("Half precision floats [-2.0, 2.0]\n");
Log::Info("---------------------------------\n");
Log::Info("-----------------------------------\n");
Log::Info(" Half precision floats [-2.0, 2.0]\n");
Log::Info("-----------------------------------\n");
bench_half(2); bench_half(2);


return EXIT_SUCCESS; return EXIT_SUCCESS;
} }


static void bench_half(int mode)
static void bench_matrix(int mode)
{ {
float result[8] = { 0.0f };
float result[5] = { 0.0f };
Timer timer; Timer timer;


/* Set up tables */ /* Set up tables */
float *pf = new float[HALF_TABLE_SIZE];
half *ph = new half[HALF_TABLE_SIZE];
mat4 *pm = new mat4[MATRIX_TABLE_SIZE + 1];
float *pf = new float[MATRIX_TABLE_SIZE];


switch (mode)
for (size_t run = 0; run < MATRIX_RUNS; run++)
{ {
case 1:
for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] = half::makebits(rand());
break;
case 2:
for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] = RandF(-2.0f, 2.0f);
break;
switch (mode)
{
case 1:
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++)
for (int j = 0; j < 4; j++)
for (int k = 0; k < 4; k++)
pm[i][j][k] = RandF(-2.0f, 2.0f);
break;
}

/* Copy matrices */
timer.GetMs();
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++)
pm[i] = pm[i + 1];
result[0] += timer.GetMs();

/* Determinant */
timer.GetMs();
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++)
pf[i] = pm[i].det();
result[1] += timer.GetMs();

/* Multiply matrices */
timer.GetMs();
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++)
pm[i] *= pm[i + 1];
result[2] += timer.GetMs();

/* Add matrices */
timer.GetMs();
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++)
pm[i] += pm[i + 1];
result[3] += timer.GetMs();

/* Invert matrix */
timer.GetMs();
for (size_t i = 0; i < MATRIX_TABLE_SIZE; i++)
pm[i] = pm[i].invert();
result[4] += timer.GetMs();
} }


delete[] pm;
delete[] pf;

for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++)
result[i] *= 1000000.0f / (MATRIX_TABLE_SIZE * MATRIX_RUNS);

Log::Info(" ns/elem\n");
Log::Info("mat4 = mat4 %7.3f\n", result[0]);
Log::Info("float = mat4.det() %7.3f\n", result[1]);
Log::Info("mat4 *= mat4 %7.3f\n", result[2]);
Log::Info("mat4 += mat4 %7.3f\n", result[3]);
Log::Info("mat4 = mat4.invert() %7.3f\n", result[4]);
}

static void bench_half(int mode)
{
float result[10] = { 0.0f };
Timer timer;

/* Set up tables */
float *pf = new float[HALF_TABLE_SIZE + 1];
half *ph = new half[HALF_TABLE_SIZE + 1];

for (size_t run = 0; run < HALF_RUNS; run++) for (size_t run = 0; run < HALF_RUNS; run++)
{ {
switch (mode)
{
case 1:
for (size_t i = 0; i < HALF_TABLE_SIZE + 1; i++)
ph[i] = half::makebits(rand());
break;
case 2:
for (size_t i = 0; i < HALF_TABLE_SIZE + 1; i++)
ph[i] = RandF(-2.0f, 2.0f);
break;
}
#if defined __EXCEPTIONS
#error lol
#endif

/* Copy float */
timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
pf[i] = pf[i + 1];
result[0] += timer.GetMs();

/* Convert half to float (array) */ /* Convert half to float (array) */
timer.GetMs(); timer.GetMs();
half::convert(pf, ph, HALF_TABLE_SIZE); half::convert(pf, ph, HALF_TABLE_SIZE);
result[0] += timer.GetMs();
result[1] += timer.GetMs();


/* Convert half to float (fast) */ /* Convert half to float (fast) */
timer.GetMs(); timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
pf[i] = (float)ph[i]; pf[i] = (float)ph[i];
result[1] += timer.GetMs();

/* Convert float to half (array) */
timer.GetMs();
half::convert(ph, pf, HALF_TABLE_SIZE);
result[2] += timer.GetMs(); result[2] += timer.GetMs();


/* Convert float to half (fast) */
/* Add a half to every float */
timer.GetMs(); timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] = (half)pf[i];
pf[i] += ph[i];
result[3] += timer.GetMs(); result[3] += timer.GetMs();


/* Convert float to half (accurate) */
/* Copy half */
timer.GetMs(); timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] = half::makeaccurate(pf[i]);
ph[i] = ph[i + 1];
result[4] += timer.GetMs(); result[4] += timer.GetMs();


/* Change sign of every half */ /* Change sign of every half */
@@ -97,33 +176,46 @@ static void bench_half(int mode)
ph[i] = -ph[i]; ph[i] = -ph[i];
result[5] += timer.GetMs(); result[5] += timer.GetMs();


/* Add a half to every float */
/* Convert float to half (array) */
timer.GetMs(); timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
pf[i] += ph[i];
half::convert(ph, pf, HALF_TABLE_SIZE);
result[6] += timer.GetMs(); result[6] += timer.GetMs();


/* Convert float to half (fast) */
timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] = (half)pf[i];
result[7] += timer.GetMs();

/* Convert float to half (accurate) */
timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] = half::makeaccurate(pf[i]);
result[8] += timer.GetMs();

/* Add a float to every half */ /* Add a float to every half */
timer.GetMs(); timer.GetMs();
for (size_t i = 0; i < HALF_TABLE_SIZE; i++) for (size_t i = 0; i < HALF_TABLE_SIZE; i++)
ph[i] += pf[i]; ph[i] += pf[i];
result[7] += timer.GetMs();
result[9] += timer.GetMs();
} }


delete[]pf;
delete[]ph;
delete[] pf;
delete[] ph;


for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++) for (size_t i = 0; i < sizeof(result) / sizeof(*result); i++)
result[i] *= 1000000.0f / (HALF_TABLE_SIZE * HALF_RUNS); result[i] *= 1000000.0f / (HALF_TABLE_SIZE * HALF_RUNS);


Log::Info(" ns/elem\n"); Log::Info(" ns/elem\n");
Log::Info("float[] = half[] %7.3f\n", result[0]);
Log::Info("float = half %7.3f\n", result[1]);
Log::Info("half[] = float[] %7.3f\n", result[2]);
Log::Info("half = float (fast) %7.3f\n", result[3]);
Log::Info("half = float (accurate) %7.3f\n", result[4]);
Log::Info("float = float %7.3f\n", result[0]);
Log::Info("float = half (array) %7.3f\n", result[1]);
Log::Info("float = half (fast) %7.3f\n", result[2]);
Log::Info("float += half %7.3f\n", result[3]);
Log::Info("half = half %7.3f\n", result[4]);
Log::Info("half = -half %7.3f\n", result[5]); Log::Info("half = -half %7.3f\n", result[5]);
Log::Info("float += half %7.3f\n", result[6]);
Log::Info("half += float %7.3f\n", result[7]);
Log::Info("half = float (array) %7.3f\n", result[6]);
Log::Info("half = float (fast) %7.3f\n", result[7]);
Log::Info("half = float (accurate) %7.3f\n", result[8]);
Log::Info("half += float %7.3f\n", result[9]);
} }



Loading…
Cancel
Save