Application Article
A High-Performance Parallel FDTD Method Enhanced by Using SSE Instruction Set
| //allocate the 1D memory | | array_name_tmp = (float*)_aligned_malloc( | | sizeof (float) * x_size * y_size * z_size, 16); | | array_name = (float ***)_aligned_malloc ( | | sizeof (float**) * x_size, 16); | | for(i = 0; i < x_size; i++)
{
| | array_name [i] = (float **)_aligned_malloc | | (sizeof (float*) * y_size, 16); | | for(j = 0; j < y_size; j++)
{
| | //map the 1D memory address to 3D array | | map_address = i * y_size * z_size + j * z_size; | | array_name [i][j] = &array_name_tmp [map_address]; | |
|