Add test files and script

This commit is contained in:
zzh 2025-04-16 22:20:21 +08:00
parent 32920ffe64
commit b0b9efdc66
3 changed files with 13 additions and 4 deletions

View File

@ -7,8 +7,8 @@ Use spdlog as log tool and the default level is 'info'.
### Features ### Features
* Fast - with the same number of threads `FastDup` is ~3.5X faster than GATK MarkDuplicatesSpark. * Fast - with the same number of threads `FastDup` is ~8X faster than GATK MarkDuplicatesSpark.
And `FastDup` achieves ~15X performance improvement over Picard MarkDuplicates. And `FastDup` achieves ~20X performance improvement over Picard MarkDuplicates.
* Generate identical outputs compared to Picard MarkDuplicates. * Generate identical outputs compared to Picard MarkDuplicates.
* The same detailed metrics data as Picard MarkDuplicates. * The same detailed metrics data as Picard MarkDuplicates.
* All data is processed in memory, with a low memory footprint even for large input files. * All data is processed in memory, with a low memory footprint even for large input files.
@ -42,6 +42,7 @@ Use spdlog as log tool and the default level is 'info'.
* libbz2 * libbz2
* liblzma * liblzma
* libcurl * libcurl
* OpenSSL
* libdeflate (optional) * libdeflate (optional)
## Install ## Install
@ -69,11 +70,11 @@ The generated binary fastdup will be in the build/bin folder.
1. get help 1. get help
```bash ```bash
fastdup --help ./fastdup --help
``` ```
2. mark duplicates on an input BAM file using 8 threads 2. mark duplicates on an input BAM file using 8 threads
```bash ```bash
fastdup --input in.bam --output out.bam --metrics stats.txt --num-threads 8 ./fastdup --input in_test.bam --output out_md.bam --metrics stats.txt --num-threads 8
``` ```

View File

@ -84,6 +84,14 @@ else()
message(FATAL_ERROR "lm is not found") message(FATAL_ERROR "lm is not found")
endif() endif()
# ssl
# Locate OpenSSL and link its SSL and Crypto imported targets into the program.
# REQUIRED makes find_package() stop configuration with its own error when
# OpenSSL cannot be found, so a separate OpenSSL_FOUND check (and a manual
# FATAL_ERROR fallback) would never be reached and is omitted.
# NOTE(review): the keyword-less target_link_libraries() signature is kept on
# purpose; switching to PRIVATE is only safe if every other
# target_link_libraries(${PG_NAME} ...) call for this target uses keywords too
# -- confirm before changing.
find_package(OpenSSL REQUIRED)
target_link_libraries(${PG_NAME} OpenSSL::SSL OpenSSL::Crypto)
# install path # install path
install(TARGETS ${PG_NAME} install(TARGETS ${PG_NAME}
RUNTIME DESTINATION bin RUNTIME DESTINATION bin

BIN
test/in_test.bam 100644

Binary file not shown.