gatk-3.8/public/VectorPairHMM/src/main/c++/utils.h

/*Copyright (c) 2012 The Broad Institute

*Permission is hereby granted, free of charge, to any person
*obtaining a copy of this software and associated documentation
*files (the "Software"), to deal in the Software without
*restriction, including without limitation the rights to use,
*copy, modify, merge, publish, distribute, sublicense, and/or sell
*copies of the Software, and to permit persons to whom the
*Software is furnished to do so, subject to the following
*conditions:

*The above copyright notice and this permission notice shall be
*included in all copies or substantial portions of the Software.

*THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
*EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
*OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
*NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
*HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
*WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
*FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR
*THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/


#ifndef PAIRHMM_UTIL_H
#define PAIRHMM_UTIL_H

#include "common_data_structure.h"

/**
 * Formats a value as text by inserting it into an output string stream
 * with the std::scientific flag set.
 *
 * std::scientific only affects floating-point insertion, so a double such
 * as 1.5 is rendered as "1.500000e+00", while integers and strings are
 * written in their usual form.
 *
 * The complete stream contents are returned. Reading the text back with
 * operator>> (as was done previously) skips leading whitespace and stops at
 * the first whitespace character, which truncated any value whose textual
 * form contains a space.
 *
 * @tparam T   any type that can be inserted into a std::ostream
 * @param obj  value to format
 * @return     textual representation of obj
 */
template<class T>
std::string to_string(T obj)
{
  std::ostringstream ss;
  ss << std::scientific << obj;
  return ss.str();
}
// Debug output helper; only the prototype is visible in this header.
// Takes a file name, the text `s`, a flag selecting append mode and a flag
// (default: true) controlling whether a newline is added.
// NOTE(review): presumably writes `s` to `filename` - confirm against the
// definition.
void debug_dump(std::string filename, std::string s, bool to_append, bool add_newline=true);

// Testcase reader; only the prototype is visible in this header.
// Takes an open input file stream, a testcase to operate on and an optional
// `reformat` flag (default: false).
// NOTE(review): the meaning of the int return value and of `reformat` is not
// visible here - confirm against the definition.
int read_mod_testcase(std::ifstream& fptr, testcase* tc, bool reformat=false);

// Processor feature queries (defined elsewhere).
bool is_avx_supported();
bool is_sse42_supported();
// Global function pointers to the single- and double-precision
// full-probability routines; declared here, defined in another translation
// unit.
// NOTE(review): presumably assigned by initialize_function_pointers() -
// confirm.
extern float (*g_compute_full_prob_float)(testcase *tc, float *before_last_log);
extern double (*g_compute_full_prob_double)(testcase *tc, double* before_last_log);
// Repeated declaration of debug_dump; the declaration earlier in this header
// already supplies the default for add_newline, so this one is redundant but
// harmless.
void debug_dump(std::string filename, std::string s, bool to_append, bool add_newline);
// Declarations of the full-probability kernels, templated on the
// floating-point type NUMBER. Only prototypes appear here; the definitions
// and instantiations live elsewhere. Each takes the testcase to evaluate and
// an optional `before_last_log` pointer that defaults to null.
// NOTE(review): the avx/sse name parts and the d/s suffixes presumably select
// the instruction set and double/single precision - confirm against the
// definitions.
template<class NUMBER>
NUMBER compute_full_prob(testcase *tc, NUMBER *before_last_log=0);
template<class NUMBER>
NUMBER compute_full_prob_avxd(testcase *tc, NUMBER *before_last_log=0);
template<class NUMBER>
NUMBER compute_full_prob_avxs(testcase *tc, NUMBER *before_last_log=0);
template<class NUMBER>
NUMBER compute_full_prob_ssed(testcase *tc, NUMBER *before_last_log=0);
template<class NUMBER>
NUMBER compute_full_prob_sses(testcase *tc, NUMBER *before_last_log=0);

// Timing helpers (prototypes only; defined elsewhere).
// NOTE(review): the units of the returned values are not visible in this
// header - confirm against the definitions before comparing or printing them.
double getCurrClk();
// Takes a pointer to a timespec; presumably fills it with the current time.
void get_time(struct timespec* x);
// Takes a previously recorded timespec by reference; presumably returns the
// time elapsed since then.
uint64_t diff_time(struct timespec& prev_time);

// Index assigned to each processor feature:
//   0 = SSE4.1, 1 = SSE4.2, 2 = AVX
// NOTE(review): these are presumably bit positions within the uint64_t
// capability mask - confirm against get_machine_capabilities().
enum ProcessorCapabilitiesEnum
{
  SSE41_CUSTOM_IDX=0,
  SSE42_CUSTOM_IDX,
  AVX_CUSTOM_IDX
};
// 64-bit mask with every bit set; used below as the default mask argument.
#define ENABLE_ALL_HARDWARE_FEATURES 0xFFFFFFFFFFFFFFFFull
// Returns a 64-bit value describing the machine (defined elsewhere).
// NOTE(review): presumably one bit per ProcessorCapabilitiesEnum index -
// confirm.
uint64_t get_machine_capabilities();
// Takes a 64-bit feature mask; by default all bits are enabled.
// NOTE(review): presumably selects the implementations behind the
// g_compute_full_prob_* pointers, restricted to features allowed by `mask` -
// confirm.
void initialize_function_pointers(uint64_t mask=ENABLE_ALL_HARDWARE_FEATURES);
// Driver entry point taking an input file name. Defaults: the old testcase
// reader is used, chunk_size is 10000 and checking is enabled.
void do_compute(char* filename, bool use_old_read_testcase=true, unsigned chunk_size=10000, bool do_check=true);

// Build-time switches. The commented-out macros below are disabled; remove
// the comment markers to define them. Their consumers are not in this header.
//#define DO_WARMUP
//#define DO_REPEAT_PROFILING
/*#define DUMP_COMPUTE_VALUES 1*/
// Batch size constant (same value as the default chunk_size of do_compute).
#define BATCH_SIZE  10000
// Defined without a value, so it can only be tested for presence (#ifdef).
#define RUN_HYBRID
/*#define PRINT_PER_INTERVAL_TIMINGS 1*/

#endif
Added public license text to all C++ files 2014-03-04 01:04:00 +08:00			`/*Copyright (c) 2012 The Broad Institute`

			`*Permission is hereby granted, free of charge, to any person`
			`*obtaining a copy of this software and associated documentation`
			`*files (the "Software"), to deal in the Software without`
			`*restriction, including without limitation the rights to use,`
			`*copy, modify, merge, publish, distribute, sublicense, and/or sell`
			`*copies of the Software, and to permit persons to whom the`
			`*Software is furnished to do so, subject to the following`
			`*conditions:`

			`*The above copyright notice and this permission notice shall be`
			`*included in all copies or substantial portions of the Software.`

			`*THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,`
			`*EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES`
			`*OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND`
			`*NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT`
			`*HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,`
			`*WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING`
			`*FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR`
			`*THE USE OR OTHER DEALINGS IN THE SOFTWARE.`
			`*/`


Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`#ifndef PAIRHMM_UTIL_H`
			`#define PAIRHMM_UTIL_H`

Parallel version of the JNI for the PairHMM The JNI treats shared memory as critical memory and doesn't allow any parallel reads or writes to it until the native code finishes. This is not a problem per se it is the right thing to do, but we need to enable -nct when running the haplotype caller and with it have multiple native PairHMM running for each map call. Move to a copy based memory sharing where the JNI simply copies the memory over to C++ and then has no blocked critical memory when running, allowing -nct to work. This version is slightly (almost unnoticeably) slower with -nct 1, but scales better with -nct 2-4 (we haven't tested anything beyond that because we know the GATK falls apart with higher levels of parallelism * Make VECTOR_LOGLESS_CACHING the default implementation for PairHMM. * Changed version number in pom.xml under public/VectorPairHMM * VectorPairHMM can now be compiled using gcc 4.8.x * Modified define-* to get rid of gcc warnings for extra tokens after #undefs * Added a Linux kernel version check for AVX - gcc's __builtin_cpu_supports function does not check whether the kernel supports AVX or not. * Updated PairHMM profiling code to update and print numbers only in single-thread mode * Edited README.md, pom.xml and Makefile for users to pass path to gcc 4.8.x if necessary * Moved all cpuid inline assembly to single function Changed info message to clog from cinfo * Modified version in pom.xml in VectorPairHMM from 3.1 to 3.2 * Deleted some unnecessary code * Modified C++ sandbox to print per interval timing 2014-03-18 02:42:19 +08:00			`#include "common_data_structure.h"`
1. Integrated Mohammad's SSE4.2 code, Mustafa's bug fix and code to fix the SSE compilation warning. 2. Added code to dynamically select between AVX, SSE4.2 and normal C++ (in that order) 3. Created multiple files to compile with different compilation flags: avx_function_prototypes.cc is compiled with -xAVX while sse_function_instantiations.cc is compiled with -xSSE4.2 flag. 4. Added jniClose() and support in Java (HaplotypeCaller, PairHMMLikelihoodCalculationEngine) to call this function at the end of the program. 5. Removed debug code, kept assertions and profiling in C++ 6. Disabled OpenMP for now. 2014-01-21 00:03:42 +08:00
			`template<class T>`
			`std::string to_string(T obj)`
			`{`
			`std::stringstream ss;`
			`std::string ret_string;`
			`ss.clear();`
			`ss << std::scientific << obj;`
			`ss >> ret_string;`
			`ss.clear();`
			`return ret_string;`
			`}`
			`void debug_dump(std::string filename, std::string s, bool to_append, bool add_newline=true);`

			`int read_mod_testcase(std::ifstream& fptr, testcase* tc, bool reformat=false);`

Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`bool is_avx_supported();`
			`bool is_sse42_supported();`
			`extern float (*g_compute_full_prob_float)(testcase *tc, float *before_last_log);`
			`extern double (*g_compute_full_prob_double)(testcase *tc, double* before_last_log);`
			`void debug_dump(std::string filename, std::string s, bool to_append, bool add_newline);`
			`template<class NUMBER>`
			`NUMBER compute_full_prob(testcase *tc, NUMBER *before_last_log=0);`
Parallel version of the JNI for the PairHMM The JNI treats shared memory as critical memory and doesn't allow any parallel reads or writes to it until the native code finishes. This is not a problem per se it is the right thing to do, but we need to enable -nct when running the haplotype caller and with it have multiple native PairHMM running for each map call. Move to a copy based memory sharing where the JNI simply copies the memory over to C++ and then has no blocked critical memory when running, allowing -nct to work. This version is slightly (almost unnoticeably) slower with -nct 1, but scales better with -nct 2-4 (we haven't tested anything beyond that because we know the GATK falls apart with higher levels of parallelism * Make VECTOR_LOGLESS_CACHING the default implementation for PairHMM. * Changed version number in pom.xml under public/VectorPairHMM * VectorPairHMM can now be compiled using gcc 4.8.x * Modified define-* to get rid of gcc warnings for extra tokens after #undefs * Added a Linux kernel version check for AVX - gcc's __builtin_cpu_supports function does not check whether the kernel supports AVX or not. * Updated PairHMM profiling code to update and print numbers only in single-thread mode * Edited README.md, pom.xml and Makefile for users to pass path to gcc 4.8.x if necessary * Moved all cpuid inline assembly to single function Changed info message to clog from cinfo * Modified version in pom.xml in VectorPairHMM from 3.1 to 3.2 * Deleted some unnecessary code * Modified C++ sandbox to print per interval timing 2014-03-18 02:42:19 +08:00			`template<class NUMBER>`
			`NUMBER compute_full_prob_avxd(testcase *tc, NUMBER *before_last_log=0);`
			`template<class NUMBER>`
			`NUMBER compute_full_prob_avxs(testcase *tc, NUMBER *before_last_log=0);`
			`template<class NUMBER>`
			`NUMBER compute_full_prob_ssed(testcase *tc, NUMBER *before_last_log=0);`
			`template<class NUMBER>`
			`NUMBER compute_full_prob_sses(testcase *tc, NUMBER *before_last_log=0);`

Added support to transfer haplotypes once per region to the JNI Re-use transferred haplotypes (stored in GlobalRef) across calls to computeLikelihoods 2014-01-23 02:52:41 +08:00			`double getCurrClk();`
1. Split main JNI function into initializeTestcases, compute_testcases and releaseReads 2. FTZ enabled 3. Cleaner profiling code 2014-02-07 06:35:32 +08:00			`void get_time(struct timespec* x);`
Includes code for all debug code for obtaining profiling info 2014-01-31 04:08:06 +08:00			`uint64_t diff_time(struct timespec& prev_time);`
Temporary commit before moving to new native library 2014-01-25 08:29:35 +08:00
1. Added more profiling code 2. Modified JNI_README 2014-01-28 06:32:44 +08:00			`//bit 0 is sse4.2, bit 1 is AVX`
Temporary commit before moving to new native library 2014-01-25 08:29:35 +08:00			`enum ProcessorCapabilitiesEnum`
			`{`
Check only for SSE 4.1 (rather than SSE 4.2) when trying to use the SSE implementation of PairHMM 2014-02-08 07:19:55 +08:00			`SSE41_CUSTOM_IDX=0,`
			`SSE42_CUSTOM_IDX,`
Temporary commit before moving to new native library 2014-01-25 08:29:35 +08:00			`AVX_CUSTOM_IDX`
			`};`
1. Added more profiling code 2. Modified JNI_README 2014-01-28 06:32:44 +08:00			`#define ENABLE_ALL_HARDWARE_FEATURES 0xFFFFFFFFFFFFFFFFull`
Temporary commit before moving to new native library 2014-01-25 08:29:35 +08:00			`uint64_t get_machine_capabilities();`
1. Added more profiling code 2. Modified JNI_README 2014-01-28 06:32:44 +08:00			`void initialize_function_pointers(uint64_t mask=ENABLE_ALL_HARDWARE_FEATURES);`
Minor: added support in C++ sandbox to choose implementation and check from command line 2014-02-10 10:05:35 +08:00			`void do_compute(char* filename, bool use_old_read_testcase=true, unsigned chunk_size=10000, bool do_check=true);`
Followed Khalid's suggestion for packing libVectorLoglessCaching into the jar file with Maven 2014-02-27 02:53:51 +08:00
			`//#define DO_WARMUP`
			`//#define DO_REPEAT_PROFILING`
Removed g_haplotype* global variables in native code so that it works with multi-threading in Java. Modified VectorLoglessPairHMM.java so that jniInitializeRegion and jniFinalizeRegion are empty 2014-03-07 14:08:35 +08:00			`/*#define DUMP_COMPUTE_VALUES 1*/`
Followed Khalid's suggestion for packing libVectorLoglessCaching into the jar file with Maven 2014-02-27 02:53:51 +08:00			`#define BATCH_SIZE 10000`
			`#define RUN_HYBRID`
Parallel version of the JNI for the PairHMM The JNI treats shared memory as critical memory and doesn't allow any parallel reads or writes to it until the native code finishes. This is not a problem per se it is the right thing to do, but we need to enable -nct when running the haplotype caller and with it have multiple native PairHMM running for each map call. Move to a copy based memory sharing where the JNI simply copies the memory over to C++ and then has no blocked critical memory when running, allowing -nct to work. This version is slightly (almost unnoticeably) slower with -nct 1, but scales better with -nct 2-4 (we haven't tested anything beyond that because we know the GATK falls apart with higher levels of parallelism * Make VECTOR_LOGLESS_CACHING the default implementation for PairHMM. * Changed version number in pom.xml under public/VectorPairHMM * VectorPairHMM can now be compiled using gcc 4.8.x * Modified define-* to get rid of gcc warnings for extra tokens after #undefs * Added a Linux kernel version check for AVX - gcc's __builtin_cpu_supports function does not check whether the kernel supports AVX or not. * Updated PairHMM profiling code to update and print numbers only in single-thread mode * Edited README.md, pom.xml and Makefile for users to pass path to gcc 4.8.x if necessary * Moved all cpuid inline assembly to single function Changed info message to clog from cinfo * Modified version in pom.xml in VectorPairHMM from 3.1 to 3.2 * Deleted some unnecessary code * Modified C++ sandbox to print per interval timing 2014-03-18 02:42:19 +08:00			`/*#define PRINT_PER_INTERVAL_TIMINGS 1*/`
Followed Khalid's suggestion for packing libVectorLoglessCaching into the jar file with Maven 2014-02-27 02:53:51 +08:00
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`#endif`