diff --git a/src/TpHostGpu.cu b/src/TpHostGpu.cu index 6cd44604d12e3c5d8ec86970661ed2b5e28fca76..4a471096f2fe0ca6324b57f4aae486c682ef8c0c 100644 --- a/src/TpHostGpu.cu +++ b/src/TpHostGpu.cu @@ -893,7 +893,8 @@ void TpHostGpu::testCorrelate2DIntraTD (int num_runs, int quad_combine){ // 886 (corr_size_combo * corr_size_combo) * sizeof(float), num_corr_combo, cudaMemcpyDeviceToHost)); - printf("Writing phase correlation data to %s\n", m_tpPaths.result_corr_quad_file); + printf("Writing phase correlation data to %s (%d x %d - not an image) \n", m_tpPaths.result_corr_quad_file, + (m_tpParams.tilesx * corr_size_combo),(m_tpParams.tilesya * corr_size_combo)); writeFloatsToFile( cpu_corr_combo, // float * data, // allocated array rslt_corr_size_combo, // int size, // length in elements @@ -906,17 +907,9 @@ void TpHostGpu::testCorrelate2DIntraTD (int num_runs, int quad_combine){ // 886 m_gpu_num_corr_tiles, sizeof(int), cudaMemcpyDeviceToHost)); - // printf("Average CORR run time =%f ms, num cor tiles (new) = %d\n", avgTimeCORR, num_corrs); - - // int corr_size = 2 * CORR_OUT_RAD + 1; - // int rslt_corr_size = num_corrs * corr_size * corr_size; - // float * cpu_corr = (float *)malloc(rslt_corr_size * sizeof(float)); - -// int num_corr_indices = num_pairs_inter * m_tpParams.num_tiles; int num_corr_indices = m_tpParams.num_pairs * m_tpParams.num_tiles; int rslt_corr_size = num_corrs * m_tpParams.corr_length; // corr_size * corr_size; int corr_img_size = num_corr_indices * 16*16; // NAN -// float * corr_img = (float *)malloc(corr_img_size * sizeof(float)); float * cpu_corr = (float *)malloc(rslt_corr_size * sizeof(float)); int * cpu_corr_indices = (int *) malloc(num_corr_indices * sizeof(int)); checkCudaErrors(cudaMemcpy2D( @@ -964,7 +957,8 @@ void TpHostGpu::testCorrelate2DIntraTD (int num_runs, int quad_combine){ // 886 cpu_corr_td, // float * cpu_corr, 16); // num_sel_sensors); // int num_sel_sensors) // // Will not be used - printf("Writing intrascene phase correlation TD data tp %s\n", m_tpPaths.result_intrascene_td); + printf("Writing intrascene phase correlation TD data tp %s (%d x %d x %d)\n", m_tpPaths.result_intrascene_td, + (m_tpParams.tilesx * 16),(m_tpParams.tilesya*16), m_tpParams.num_pairs); writeFloatsToFile( corr_img_td, // float * data, // allocated array corr_img_size, // int size, // length in elements @@ -1268,9 +1262,9 @@ void TpHostGpu::testTextures ( gpu_pnum_texture_tiles, sizeof(int), cudaMemcpyDeviceToHost)); - printf("cpu_pnum_texture_tiles = %d\n", cpu_pnum_texture_tiles); - printf("tile_texture_layers = %d\n", m_tile_texture_layers); } // if (use_dp) { + printf("cpu_pnum_texture_tiles = %d\n", cpu_pnum_texture_tiles); + printf("tile_texture_layers = %d\n", m_tile_texture_layers); int rslt_texture_size = m_num_textures * m_tile_texture_size; @@ -1328,29 +1322,20 @@ void TpHostGpu::testTextures ( cpu_diff_rgb_combo_out[nl * ntiles + ntile] = cpu_diff_rgb_combo[ntile * nlayers + nl]; } } - if (!use_dp) { - printf("Writing phase texture data to %s\n", m_tpPaths.result_textures_file); - writeFloatsToFile( - non_overlap_layers, // float * data, // allocated array - rslt_texture_size, // int size, // length in elements - m_tpPaths.result_textures_file); // const char * path) // file path - printf("Writing low-res data to %s\n", m_tpPaths.result_diff_rgb_combo_file); - writeFloatsToFile( - cpu_diff_rgb_combo_out, // cpu_diff_rgb_combo, // float * data, // allocated array - diff_rgb_combo_size, // int size, // length in elements - m_tpPaths.result_diff_rgb_combo_file); // const char * path) // file path - } else { // if (!use_dp) { - printf("Writing phase texture data to %s\n", m_tpPaths.result_textures_file_dp); - writeFloatsToFile( - non_overlap_layers, // float * data, // allocated array - rslt_texture_size, // int size, // length in elements - m_tpPaths.result_textures_file_dp); // const char * path) // file path - printf("Writing low-res data to %s\n", m_tpPaths.result_diff_rgb_combo_file_dp); - writeFloatsToFile( - cpu_diff_rgb_combo_out, // cpu_diff_rgb_combo, // float * data, // allocated array - diff_rgb_combo_size, // int size, // length in elements - m_tpPaths.result_diff_rgb_combo_file_dp); // const char * path) // file path - } // if (!use_dp) { else + const char * result_textures_file = use_dp ? m_tpPaths.result_textures_file_dp : m_tpPaths.result_textures_file; + const char * result_diff_rgb_combo_file = use_dp ? m_tpPaths.result_diff_rgb_combo_file_dp : m_tpPaths.result_diff_rgb_combo_file; + printf("Writing phase texture data to %s (%d x % d x %d)\n", result_textures_file, + m_tpParams.tilesx * m_tpParams.dtt_size2, m_tpParams.tilesy * m_tpParams.dtt_size2, m_tile_texture_layers); + writeFloatsToFile( + non_overlap_layers, // float * data, // allocated array + rslt_texture_size, // int size, // length in elements + result_textures_file); // const char * path) // file path + printf("Writing low-res data to %s (%d x %d x %d)\n", result_diff_rgb_combo_file, + m_tpParams.tilesx, m_tpParams.tilesy, nlayers); + writeFloatsToFile( + cpu_diff_rgb_combo_out, // cpu_diff_rgb_combo, // float * data, // allocated array + diff_rgb_combo_size, // int size, // length in elements + result_diff_rgb_combo_file); // const char * path) // file path if ( m_tpParams.debug_tile) { if (debug) { int texture_offset = m_tpParams.dbg_tile * m_tile_texture_size; @@ -1518,19 +1503,14 @@ void TpHostGpu::testTexturesRGBA ( rgba_height * rbga_slices, cudaMemcpyDeviceToHost)); printf("Import raw, real, little-endian, 18 images 648x520\n"); - if (!use_dp) { - printf("Writing RBGA texture slices to %s\n", m_tpPaths.result_textures_rgba_file); - writeFloatsToFile( - cpu_textures_rgba, // float * data, // allocated array - rslt_rgba_size, // int size, // length in elements - m_tpPaths.result_textures_rgba_file); // const char * path) // file path - } else { // if (use_dp) { - printf("Writing RBGA texture slices to %s\n", m_tpPaths.result_textures_rgba_file_dp); + const char * result_textures_rgba_file = use_dp ? m_tpPaths.result_textures_rgba_file_dp : m_tpPaths.result_textures_rgba_file; + + printf("Writing RBGA texture slices to %s (%d x %d x %d)\n", result_textures_rgba_file, + rgba_woi_width, rgba_woi_height, rbga_slices); writeFloatsToFile( cpu_textures_rgba, // float * data, // allocated array rslt_rgba_size, // int size, // length in elements - m_tpPaths.result_textures_rgba_file_dp); // const char * path) // file path - } // if (use_dp) { // else + result_textures_rgba_file); // const char * path) // file path if ( m_tpParams.debug_tile) { if (debug) { @@ -1565,7 +1545,7 @@ void TpHostGpu::saveClt( m_gpu_clt_h[ncam], rslt_size * sizeof(float), cudaMemcpyDeviceToHost)); - printf("Writing %s to %s\n", prompt, paths[ncam]); + printf("Writing %s to %s (%d * %d * 4 * %d * %d)\n", prompt, paths[ncam], m_tpParams.tilesx, m_tpParams.tilesy, m_tpParams.dtt_size, m_tpParams.dtt_size); writeFloatsToFile(cpu_clt, // float * data, // allocated array rslt_size, // int size, // length in elements paths[ncam]); // const char * path) // file path @@ -1589,7 +1569,8 @@ void TpHostGpu::saveRgb( (m_tpParams.img_width + m_tpParams.dtt_size) * sizeof(float), m_tpParams.num_colors* (m_tpParams.img_height + m_tpParams.dtt_size), cudaMemcpyDeviceToHost)); - printf("Writing %s to %s\n", prompt, paths[ncam]); + printf("Writing %s to %s (%d * %d * %d)\n", prompt, paths[ncam], + (m_tpParams.img_width + m_tpParams.dtt_size), (m_tpParams.img_height + m_tpParams.dtt_size), m_tpParams.num_colors); writeFloatsToFile( // will have margins cpu_corr_image, // float * data, // allocated array rslt_img_size, // int size, // length in elements @@ -1689,7 +1670,9 @@ void TpHostGpu::saveInterCorrFile( cpu_corr_indices, // int * cpu_corr_indices, cpu_corr_td, // float * cpu_corr, num_sel_sensors); // int num_sel_sensors) - printf("Writing %s TD data to %s\n", prompt, path); + int num_slices = num_corr_indices / (m_tpParams.tilesx * m_tpParams.tilesy); + printf("Writing %s TD data to %s (%d x %d x %d)\n", prompt, path, + m_tpParams.tilesx * m_tpParams.dtt_size2 , m_tpParams.tilesy * m_tpParams.dtt_size2 , num_slices); writeFloatsToFile( corr_img_td, // float * data, // allocated array corr_img_size, // int size, // length in elements @@ -1727,11 +1710,13 @@ void TpHostGpu::saveInterCorrIndicesFile( int tx = ctt % m_tpParams.tilesx; corr_index_img[cpair * m_tpParams.tilesx * m_tpParams.tilesy + m_tpParams.tilesx * ty + tx] = ict; // cpu_corr_indices[ict]; } - printf("Writing %s to %s\n",prompt,path); + int num_slices = num_corr_indices / (m_tpParams.tilesx * m_tpParams.tilesy); + printf("Writing %s to %s (%d x %d x %d - not an image)\n",prompt,path, + m_tpParams.tilesx, m_tpParams.tilesy, num_slices); writeFloatsToFile( corr_index_img, // float * data, // allocated array corr_index_img_length, // int size, // length in elements - "clt/aux_inter-indices.raw"); // const char * path) // file path + path); // const char * path) // file path free (corr_index_img); free (cpu_corr_indices); } diff --git a/src/test_tp.cu b/src/test_tp.cu index c88b12353559c479be2e47a26df3cd83578c7c88..194013283d4f3cf5c289b94fae8f01bce96cdd03 100644 --- a/src/test_tp.cu +++ b/src/test_tp.cu @@ -126,7 +126,7 @@ int main(int argc, char **argv) 0.0, // const float target_disparity, // DBG_DISPARITY == 0.0 0.0, // const float scale, // 0.0 0, // int quad_combine, - 0, // int use_dp, + 1, // int use_dp, 0); // int debug); return 0; /* */