# gatk-3.8/public/VectorPairHMM/src/main/c++/Makefile

# Copyright (c) 2012 The Broad Institute
#
# Permission is hereby granted, free of charge, to any person
# obtaining a copy of this software and associated documentation
# files (the "Software"), to deal in the Software without
# restriction, including without limitation the rights to use,
# copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the
# Software is furnished to do so, subject to the following
# conditions:
#
# The above copyright notice and this permission notice shall be
# included in all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
# OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
# NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
# HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
# WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR
# THE USE OR OTHER DEALINGS IN THE SOFTWARE.


# Optional OpenMP support, currently switched off. Uncommenting these two
# lines adds the flag to COMMON_COMPILATION_FLAGS (via OMPCFLAGS) and to
# every link command that expands $(OMPLFLAGS).
#OMPCFLAGS=-fopenmp
#OMPLFLAGS=-fopenmp #-openmp-link static

# Commented-out alternative flag sets; CFLAGS is not consumed by any rule
# in this file.
#CFLAGS=-O2 -std=c++11 -W -Wall -march=corei7-avx -Wa,-q            -pedantic $(OMPCFLAGS) -Wno-unknown-pragmas
#CFLAGS=-O2             -W -Wall -march=corei7 -mfpmath=sse -msse4.2 -pedantic $(OMPCFLAGS) -Wno-unknown-pragmas

# JRE_HOME may be supplied by the caller (environment or command line); the
# JNI headers are looked up relative to it, in ../include and ../include/linux.
JRE_HOME?=/opt/jdk1.7.0_25/jre
JNI_COMPILATION_FLAGS=-D_REENTRANT -fPIC -I${JRE_HOME}/../include -I${JRE_HOME}/../include/linux

# Flags applied to every object file; vectorization switches are added per
# object via target-specific CXXFLAGS.
COMMON_COMPILATION_FLAGS=$(JNI_COMPILATION_FLAGS) -O3 -W -Wall -pedantic $(OMPCFLAGS) -Wno-unknown-pragmas
CC=icc
CXX=icc

# Libraries appended to every link command.
# NOTE(review): OMPLDFLAGS is never assigned in this file -- the commented
# knob above is spelled OMPLFLAGS. Left untouched because the link rules
# already pass $(OMPLFLAGS) themselves; confirm whether this is a typo.
LDFLAGS=-lm -lrt $(OMPLDFLAGS)

# `make DISABLE_FTZ=1` defines the DISABLE_FTZ macro for the sources and
# passes -no-ftz to the compiler. This block used to be present twice, which
# appended the same two flags twice; once is enough.
ifdef DISABLE_FTZ
  COMMON_COMPILATION_FLAGS+=-DDISABLE_FTZ -no-ftz
endif

# `make USE_PAPI=1` compiles with -DUSE_PAPI and links against libpapi from
# PAPI_DIR. PAPI_DIR uses ?= so that an installation path can be provided
# from the environment instead of editing this file; any other value of
# USE_PAPI (or none) leaves the flags untouched.
PAPI_DIR?=/home/karthikg/softwares/papi-5.3.0
ifeq ($(USE_PAPI),1)
  COMMON_COMPILATION_FLAGS+=-I$(PAPI_DIR)/include -DUSE_PAPI
  LDFLAGS+=-L$(PAPI_DIR)/lib -lpapi
endif

# Link outputs produced by the default goal.
BIN=libVectorLoglessPairHMM.so \
    pairhmm-template-main \
    checker

# Compiler-generated dependency files live in DEPDIR; DF is the one that
# belongs to the object currently being built ($* is the pattern stem).
DEPDIR=.deps
DF=$(DEPDIR)/$(*).d

# Sources linked into both the JNI library and the standalone executables.
COMMON_SOURCES=utils.cc \
               avx_function_instantiations.cc \
               baseline.cc \
               sse_function_instantiations.cc \
               LoadTimeInitializer.cc

# Sources that make up the JNI library (JNI entry points + common code).
LIBSOURCES=org_broadinstitute_sting_utils_pairhmm_VectorLoglessPairHMM.cc \
           org_broadinstitute_sting_utils_pairhmm_DebugJNILoglessPairHMM.cc \
           Sandbox.cc \
           $(COMMON_SOURCES)

# Every translation unit known to this Makefile.
SOURCES=$(LIBSOURCES) pairhmm-template-main.cc pairhmm-1-base.cc

LIBOBJECTS=$(patsubst %.cc,%.o,$(LIBSOURCES))
COMMON_OBJECTS=$(patsubst %.cc,%.o,$(COMMON_SOURCES))


# The sources are split into three groups by the instruction-set switch
# they are compiled with.

# Group 1: built with the common flags only (no vectorization switch).
NO_VECTOR_SOURCES=org_broadinstitute_sting_utils_pairhmm_VectorLoglessPairHMM.cc \
                  org_broadinstitute_sting_utils_pairhmm_DebugJNILoglessPairHMM.cc \
                  pairhmm-template-main.cc \
                  pairhmm-1-base.cc \
                  utils.cc \
                  baseline.cc \
                  LoadTimeInitializer.cc \
                  Sandbox.cc
# Group 2: built with -xAVX.
AVX_SOURCES=avx_function_instantiations.cc
# Group 3: built with -xSSE4.2.
SSE_SOURCES=sse_function_instantiations.cc

NO_VECTOR_OBJECTS=$(patsubst %.cc,%.o,$(NO_VECTOR_SOURCES))
AVX_OBJECTS=$(patsubst %.cc,%.o,$(AVX_SOURCES))
SSE_OBJECTS=$(patsubst %.cc,%.o,$(SSE_SOURCES))

# Target-specific CXXFLAGS select the right switch for each group.
$(NO_VECTOR_OBJECTS): CXXFLAGS=$(COMMON_COMPILATION_FLAGS)
$(AVX_OBJECTS): CXXFLAGS=$(COMMON_COMPILATION_FLAGS) -xAVX
$(SSE_OBJECTS): CXXFLAGS=$(COMMON_COMPILATION_FLAGS) -xSSE4.2

# Union of the three groups; this is the target list of the compile rule.
OBJECTS=$(NO_VECTOR_OBJECTS) $(AVX_OBJECTS) $(SSE_OBJECTS)

# These targets name actions, not files. Declaring them phony keeps a stray
# file called "all", "copied_lib" or "clean" from making the target look
# up to date and silently skipping its recipe.
.PHONY: all copied_lib clean

# Default goal: the link outputs in BIN, the Java sandbox class, and the
# optional copy of the shared library into OUTPUT_DIR.
all: $(BIN) Sandbox.class copied_lib

# Pull in the compiler-generated dependency files. The leading '-' makes a
# missing file (e.g. on the first build) a non-error.
-include $(addprefix $(DEPDIR)/,$(SOURCES:.cc=.d))

# Standalone executable built from pairhmm-1-base plus the common objects.
checker: pairhmm-1-base.o $(COMMON_OBJECTS)
	$(CXX) $(OMPLFLAGS) -o $@ $^ $(LDFLAGS)

# Standalone executable built from pairhmm-template-main plus the common objects.
pairhmm-template-main:	pairhmm-template-main.o $(COMMON_OBJECTS)
	$(CXX) $(OMPLFLAGS) -o $@ $^ $(LDFLAGS)

# Shared library containing the JNI entry points and the common objects.
libVectorLoglessPairHMM.so: $(LIBOBJECTS) 
	$(CXX) $(OMPLFLAGS) -shared -static-intel -o $@ $(LIBOBJECTS) ${LDFLAGS}


# Static pattern rule: compile each listed object from its .cc file using
# the target-specific CXXFLAGS, and write its dependency file to $(DF).
$(OBJECTS): %.o: %.cc
	@mkdir -p $(DEPDIR)
	$(CXX) -c -MMD -MF $(DF) $(CXXFLAGS) $(OUTPUT_OPTION) $<

# Java side of the sandbox.
Sandbox.class: Sandbox.java
	javac $<

# When OUTPUT_DIR is set, mirror the freshly built library into it; when it
# is not set this target has no recipe and only forces the library build.
copied_lib: libVectorLoglessPairHMM.so
ifdef OUTPUT_DIR
	mkdir -p $(OUTPUT_DIR)
	rsync -a $< $(OUTPUT_DIR)/
endif

# Remove link outputs, objects, dependency files and Java classes.
clean:
	rm -rf $(BIN) *.o $(DEPDIR) *.class
Added public license text to all C++ files 2014-03-04 01:04:00 +08:00			`/*Copyright (c) 2012 The Broad Institute`

			`*Permission is hereby granted, free of charge, to any person`
			`*obtaining a copy of this software and associated documentation`
			`*files (the "Software"), to deal in the Software without`
			`*restriction, including without limitation the rights to use,`
			`*copy, modify, merge, publish, distribute, sublicense, and/or sell`
			`*copies of the Software, and to permit persons to whom the`
			`*Software is furnished to do so, subject to the following`
			`*conditions:`

			`*The above copyright notice and this permission notice shall be`
			`*included in all copies or substantial portions of the Software.`

			`*THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,`
			`*EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES`
			`*OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND`
			`*NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT`
			`*HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,`
			`*WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING`
			`*FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR`
			`*THE USE OR OTHER DEALINGS IN THE SOFTWARE.`
			`*/`


1. Converted q,i,d,c in C++ from int* to char* 2. Use clock_gettime to measure performance 3. Disabled OpenMP 4. Moved LoadTimeInitializer to different file 2014-01-23 14:57:32 +08:00			`#OMPCFLAGS=-fopenmp`
			`#OMPLFLAGS=-fopenmp #-openmp-link static`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
			`#CFLAGS=-O2 -std=c++11 -W -Wall -march=corei7-avx -Wa,-q -pedantic $(OMPCFLAGS) -Wno-unknown-pragmas`
			`#CFLAGS=-O2 -W -Wall -march=corei7 -mfpmath=sse -msse4.2 -pedantic $(OMPCFLAGS) -Wno-unknown-pragmas`

1. Changed logger.info to logger.warn in PairHMMLikelihoodCalculationEngine.java 2. Committing the right set of files after rebase 2014-03-01 08:08:28 +08:00			`JRE_HOME?=/opt/jdk1.7.0_25/jre`
1. Renamed directory structure from public/c++/VectorPairHMM to public/VectorPairHMM/src/main/c++ as per Khalid's suggestion 2. Use java.home in public/VectorPairHMM/pom.xml to pass environment variable JRE_HOME to the make process. This is needed because the Makefile needs to compile JNI code with the flag -I<JRE_HOME>/../include (among others). Assuming that the Maven build process uses a JDK (and not just a JRE), the variable java.home points to the JRE inside maven. 3. Dropped all pretense at cross-platform compatibility. Removed Mac profile from pom.xml for VectorPairHMM 2014-02-27 07:17:15 +08:00			`JNI_COMPILATION_FLAGS=-D_REENTRANT -fPIC -I${JRE_HOME}/../include -I${JRE_HOME}/../include/linux`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`COMMON_COMPILATION_FLAGS=$(JNI_COMPILATION_FLAGS) -O3 -W -Wall -pedantic $(OMPCFLAGS) -Wno-unknown-pragmas`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00			`CC=icc`
			`CXX=icc`

1. Converted q,i,d,c in C++ from int* to char* 2. Use clock_gettime to measure performance 3. Disabled OpenMP 4. Moved LoadTimeInitializer to different file 2014-01-23 14:57:32 +08:00			`LDFLAGS=-lm -lrt $(OMPLDFLAGS)`
1. Enabled FTZ in LoadTimeInitializer.cc 2. Added Sandbox.java for testing 3. Moved compute to utils.cc (inside library) 4. Added flag for disabling FTZ in Makefile 2014-02-07 03:01:33 +08:00			`ifdef DISABLE_FTZ`
			`COMMON_COMPILATION_FLAGS+=-DDISABLE_FTZ -no-ftz`
			`endif`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
Contains profiling, exception tracking, PAPI code Contains Sandbox Java 2014-02-05 08:27:29 +08:00			`PAPI_DIR=/home/karthikg/softwares/papi-5.3.0`
			`ifdef USE_PAPI`
			`ifeq ($(USE_PAPI),1)`
1. Whew, finally debugged the source of performance issues with PairHMM JNI. See copied text from email below. 2. This commit contains all the code used in profiling, detecting FP exceptions, dumping intermediate results. All flagged off using ifdefs, but it's there. --------------Text from email As we discussed before, it's the denormal numbers that are causing the slowdown - the core executes some microcode uops (called FP assists) when denormal numbers are detected for FP operations (even un-vectorized code). The C++ compiler by default enables flush to zero (FTZ) - when set, the hardware simply converts denormal numbers to 0. The Java binary (executable provided by Oracle, not the native library) seems to be compiled without FTZ (sensible choice, they want to be conservative). Hence, the JNI invocation sees a large slowdown. Disabling FTZ in C++ slows down the C++ sandbox performance to the JNI version (fortunately, the reverse also holds :)). Not sure how to show the overhead for these FP assists easily - measured a couple of counters. FP_ASSISTS:ANY - shows number of uops executed as part of the FP assists. When FTZ is enabled, this is 0 (both C++ and JNI), when FTZ is disabled this value is around 203540557 (both C++ and JNI) IDQ:MS_UOPS_CYCLES - shows the number of cycles the decoder was issuing uops when the microcode sequencing engine was busy. When FTZ is enabled, this is around 1.77M cycles (both C++ and JNI), when FTZ is disabled this value is around 4.31B cycles (both C++ and JNI). This number is still small with respect to total cycles (~40B), but it only reflects the cycles in the decode stage. The total overhead of the microcode assist ops could be larger. As suggested by Mustafa, I compared intermediate values (matrices M,X,Y) and final output of compute_full_prob. The values produced by C++ and Java are identical to the last bit (as long as both use FTZ or no-FTZ). 
Comparing the outputs of compute_full_prob for the cases no-FTZ and FTZ, there are differences for very small values (denormal numbers). Examples: Diff values 1.952970E-33 1.952967E-33 Diff values 1.135071E-32 1.135070E-32 Diff values 1.135071E-32 1.135070E-32 Diff values 1.135071E-32 1.135070E-32 For this test case (low coverage NA12878), all these values would be recomputed using the double precision version. Enabling FTZ should be fine. -------------------End text from email 2014-02-06 09:09:57 +08:00			`COMMON_COMPILATION_FLAGS+=-I$(PAPI_DIR)/include -DUSE_PAPI`
Contains profiling, exception tracking, PAPI code Contains Sandbox Java 2014-02-05 08:27:29 +08:00			`LDFLAGS+=-L$(PAPI_DIR)/lib -lpapi`
			`endif`
			`endif`

1. Whew, finally debugged the source of performance issues with PairHMM JNI. See copied text from email below. 2. This commit contains all the code used in profiling, detecting FP exceptions, dumping intermediate results. All flagged off using ifdefs, but it's there. --------------Text from email As we discussed before, it's the denormal numbers that are causing the slowdown - the core executes some microcode uops (called FP assists) when denormal numbers are detected for FP operations (even un-vectorized code). The C++ compiler by default enables flush to zero (FTZ) - when set, the hardware simply converts denormal numbers to 0. The Java binary (executable provided by Oracle, not the native library) seems to be compiled without FTZ (sensible choice, they want to be conservative). Hence, the JNI invocation sees a large slowdown. Disabling FTZ in C++ slows down the C++ sandbox performance to the JNI version (fortunately, the reverse also holds :)). Not sure how to show the overhead for these FP assists easily - measured a couple of counters. FP_ASSISTS:ANY - shows number of uops executed as part of the FP assists. When FTZ is enabled, this is 0 (both C++ and JNI), when FTZ is disabled this value is around 203540557 (both C++ and JNI) IDQ:MS_UOPS_CYCLES - shows the number of cycles the decoder was issuing uops when the microcode sequencing engine was busy. When FTZ is enabled, this is around 1.77M cycles (both C++ and JNI), when FTZ is disabled this value is around 4.31B cycles (both C++ and JNI). This number is still small with respect to total cycles (~40B), but it only reflects the cycles in the decode stage. The total overhead of the microcode assist ops could be larger. As suggested by Mustafa, I compared intermediate values (matrices M,X,Y) and final output of compute_full_prob. The values produced by C++ and Java are identical to the last bit (as long as both use FTZ or no-FTZ). 
Comparing the outputs of compute_full_prob for the cases no-FTZ and FTZ, there are differences for very small values (denormal numbers). Examples: Diff values 1.952970E-33 1.952967E-33 Diff values 1.135071E-32 1.135070E-32 Diff values 1.135071E-32 1.135070E-32 Diff values 1.135071E-32 1.135070E-32 For this test case (low coverage NA12878), all these values would be recomputed using the double precision version. Enabling FTZ should be fine. -------------------End text from email 2014-02-06 09:09:57 +08:00			`ifdef DISABLE_FTZ`
			`COMMON_COMPILATION_FLAGS+=-DDISABLE_FTZ -no-ftz`
			`endif`

1. Cleaned up code 2. Split into DebugJNILoglessPairHMM and VectorLoglessPairHMM with base class JNILoglessPairHMM. DebugJNILoglessPairHMM can, in principle, invoke any other child class of JNILoglessPairHMM. 3. Added more profiling code for Java parts of LoglessPairHMM 2014-01-27 11:18:12 +08:00			`BIN=libVectorLoglessPairHMM.so pairhmm-template-main checker`
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`#BIN=checker`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
			`DEPDIR=.deps`
			`DF=$(DEPDIR)/$(*).d`

Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`#Common across libJNI and sandbox`
Added support to transfer haplotypes once per region to the JNI Re-use transferred haplotypes (stored in GlobalRef) across calls to computeLikelihoods 2014-01-23 02:52:41 +08:00			`COMMON_SOURCES=utils.cc avx_function_instantiations.cc baseline.cc sse_function_instantiations.cc LoadTimeInitializer.cc`
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`#Part of libJNI`
Contains profiling, exception tracking, PAPI code Contains Sandbox Java 2014-02-05 08:27:29 +08:00			`LIBSOURCES=org_broadinstitute_sting_utils_pairhmm_VectorLoglessPairHMM.cc org_broadinstitute_sting_utils_pairhmm_DebugJNILoglessPairHMM.cc Sandbox.cc $(COMMON_SOURCES)`
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`SOURCES=$(LIBSOURCES) pairhmm-template-main.cc pairhmm-1-base.cc`
			`LIBOBJECTS=$(LIBSOURCES:.cc=.o)`
			`COMMON_OBJECTS=$(COMMON_SOURCES:.cc=.o)`


			`#No vectorization for these files`
Contains profiling, exception tracking, PAPI code Contains Sandbox Java 2014-02-05 08:27:29 +08:00			`NO_VECTOR_SOURCES=org_broadinstitute_sting_utils_pairhmm_VectorLoglessPairHMM.cc org_broadinstitute_sting_utils_pairhmm_DebugJNILoglessPairHMM.cc pairhmm-template-main.cc pairhmm-1-base.cc utils.cc baseline.cc LoadTimeInitializer.cc Sandbox.cc`
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`#Use -xAVX for these files`
			`AVX_SOURCES=avx_function_instantiations.cc`
			`#Use -xSSE4.2 for these files`
1. Integrated Mohammad's SSE4.2 code, Mustafa's bug fix and code to fix the SSE compilation warning. 2. Added code to dynamically select between AVX, SSE4.2 and normal C++ (in that order) 3. Created multiple files to compile with different compilation flags: avx_function_prototypes.cc is compiled with -xAVX while sse_function_instantiations.cc is compiled with -xSSE4.2 flag. 4. Added jniClose() and support in Java (HaplotypeCaller, PairHMMLikelihoodCalculationEngine) to call this function at the end of the program. 5. Removed debug code, kept assertions and profiling in C++ 6. Disabled OpenMP for now. 2014-01-21 00:03:42 +08:00			`SSE_SOURCES=sse_function_instantiations.cc`
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00
			`NO_VECTOR_OBJECTS=$(NO_VECTOR_SOURCES:.cc=.o)`
			`AVX_OBJECTS=$(AVX_SOURCES:.cc=.o)`
			`SSE_OBJECTS=$(SSE_SOURCES:.cc=.o)`
			`$(NO_VECTOR_OBJECTS): CXXFLAGS=$(COMMON_COMPILATION_FLAGS)`
			`$(AVX_OBJECTS): CXXFLAGS=$(COMMON_COMPILATION_FLAGS) -xAVX`
			`$(SSE_OBJECTS): CXXFLAGS=$(COMMON_COMPILATION_FLAGS) -xSSE4.2`
			`OBJECTS=$(NO_VECTOR_OBJECTS) $(AVX_OBJECTS) $(SSE_OBJECTS)`

Followed Khalid's suggestion for packing libVectorLoglessCaching into the jar file with Maven 2014-02-27 02:53:51 +08:00			`all: $(BIN) Sandbox.class copied_lib`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
			`-include $(addprefix $(DEPDIR)/,$(SOURCES:.cc=.d))`

Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`checker: pairhmm-1-base.o $(COMMON_OBJECTS)`
Added support to transfer haplotypes once per region to the JNI Re-use transferred haplotypes (stored in GlobalRef) across calls to computeLikelihoods 2014-01-23 02:52:41 +08:00			`$(CXX) $(OMPLFLAGS) -o $@ $^ $(LDFLAGS)`
1. Nested loops over reads and haplotypes moved to C++ through JNI 2. OpenMP support added 3. Using direct access to Java primitive arrays 4. Debug messages disabled 2014-01-17 11:53:50 +08:00
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`pairhmm-template-main: pairhmm-template-main.o $(COMMON_OBJECTS)`
Added support to transfer haplotypes once per region to the JNI Re-use transferred haplotypes (stored in GlobalRef) across calls to computeLikelihoods 2014-01-23 02:52:41 +08:00			`$(CXX) $(OMPLFLAGS) -o $@ $^ $(LDFLAGS)`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
1. Cleaned up code 2. Split into DebugJNILoglessPairHMM and VectorLoglessPairHMM with base class JNILoglessPairHMM. DebugJNILoglessPairHMM can, in principle, invoke any other child class of JNILoglessPairHMM. 3. Added more profiling code for Java parts of LoglessPairHMM 2014-01-27 11:18:12 +08:00			`libVectorLoglessPairHMM.so: $(LIBOBJECTS)`
Includes code for all debug code for obtaining profiling info 2014-01-31 04:08:06 +08:00			`$(CXX) $(OMPLFLAGS) -shared -static-intel -o $@ $(LIBOBJECTS) ${LDFLAGS}`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00
			`$(OBJECTS): %.o: %.cc`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00			`@mkdir -p $(DEPDIR)`
Added support for dynamic selection between AVX and un-vectorized C++, still to include SSE code from Mohammad. Debug flags turned on in this commit. 2014-01-19 03:07:23 +08:00			`$(CXX) -c -MMD -MF $(DF) $(CXXFLAGS) $(OUTPUT_OPTION) $<`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
Contains profiling, exception tracking, PAPI code Contains Sandbox Java 2014-02-05 08:27:29 +08:00			`Sandbox.class: Sandbox.java`
			`javac Sandbox.java`
First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00
Followed Khalid's suggestion for packing libVectorLoglessCaching into the jar file with Maven 2014-02-27 02:53:51 +08:00			`copied_lib: libVectorLoglessPairHMM.so`
			`ifdef OUTPUT_DIR`
			`mkdir -p $(OUTPUT_DIR)`
			`rsync -a libVectorLoglessPairHMM.so $(OUTPUT_DIR)/`
			`endif`

First import of AVX-JNI to git 2014-01-15 09:26:55 +08:00			`clean:`
Contains profiling, exception tracking, PAPI code Contains Sandbox Java 2014-02-05 08:27:29 +08:00			`rm -rf $(BIN) *.o $(DEPDIR) *.class`