2009-03-18 07:22:37 +08:00
|
|
|
package org.broadinstitute.sting.gatk;
|
|
|
|
|
|
2009-07-22 02:32:22 +08:00
|
|
|
import java.util.*;
|
2009-03-18 07:22:37 +08:00
|
|
|
|
2009-07-10 07:59:53 +08:00
|
|
|
import org.broadinstitute.sting.gatk.walkers.*;
|
2009-05-20 07:26:17 +08:00
|
|
|
import org.broadinstitute.sting.gatk.refdata.ReferenceOrderedDatum;
|
|
|
|
|
import org.broadinstitute.sting.gatk.refdata.ReferenceOrderedData;
|
2009-05-16 05:02:12 +08:00
|
|
|
import org.broadinstitute.sting.utils.StingException;
|
2009-07-22 02:32:22 +08:00
|
|
|
import org.broadinstitute.sting.utils.PackageUtils;
|
2009-03-27 21:27:04 +08:00
|
|
|
import org.apache.log4j.Logger;
|
2009-07-10 07:59:53 +08:00
|
|
|
import net.sf.picard.filter.SamRecordFilter;
|
2009-03-18 07:22:37 +08:00
|
|
|
|
|
|
|
|
/**
 * Keeps a registry of the available walker classes, keyed by walker name, and
 * offers static helpers that read the annotations declared on a walker class
 * (By, Requires, Allows, ReadFilters and WalkerName).
 *
 * User: hanna
 * Date: Mar 17, 2009
 * Time: 3:14:28 PM
 */
|
|
|
|
|
public class WalkerManager {
|
|
|
|
|
|
2009-03-27 21:27:04 +08:00
|
|
|
/**
|
|
|
|
|
* our log, which we want to capture anything from this class
|
|
|
|
|
*/
|
|
|
|
|
private static Logger logger = Logger.getLogger(WalkerManager.class);
|
|
|
|
|
|
2009-05-28 09:35:49 +08:00
|
|
|
/**
 * Walker classes keyed by walker name. Assigned exactly once, by the
 * constructor, and therefore declared final.
 */
private final Map<String, Class<? extends Walker>> walkersByName;
|
2009-03-27 21:27:04 +08:00
|
|
|
|
2009-07-22 02:32:22 +08:00
|
|
|
/**
 * Builds the manager: asks PackageUtils for every class implementing Walker
 * and indexes those classes by walker name.
 */
public WalkerManager() {
    List<Class<? extends Walker>> discovered = PackageUtils.getClassesImplementingInterface(Walker.class);
    this.walkersByName = createWalkerDatabase(discovered);
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Does a walker with the given name exist?
|
2009-03-27 21:27:04 +08:00
|
|
|
*
|
2009-03-18 07:22:37 +08:00
|
|
|
* @param walkerName Name of the walker for which to search.
|
|
|
|
|
* @return True if the walker exists, false otherwise.
|
|
|
|
|
*/
|
|
|
|
|
public boolean doesWalkerExist(String walkerName) {
|
2009-05-28 09:35:49 +08:00
|
|
|
return walkersByName.containsKey(walkerName);
|
2009-03-18 07:22:37 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Gets a walker with the given name, or null if no walker exists.
|
2009-03-27 21:27:04 +08:00
|
|
|
*
|
2009-03-18 07:22:37 +08:00
|
|
|
* @param walkerName Name of the walker to retrieve.
|
|
|
|
|
* @return The walker object if found; null otherwise.
|
|
|
|
|
*/
|
2009-03-27 04:45:27 +08:00
|
|
|
public Walker createWalkerByName(String walkerName)
|
|
|
|
|
throws InstantiationException, IllegalAccessException {
|
2009-05-28 09:35:49 +08:00
|
|
|
Class<? extends Walker> walker = walkersByName.get(walkerName);
|
2009-07-17 06:02:21 +08:00
|
|
|
if( walker == null )
|
|
|
|
|
throw new StingException(String.format("Could not find walker with name: %s", walkerName));
|
2009-05-28 09:35:49 +08:00
|
|
|
return walker.newInstance();
|
2009-03-27 04:45:27 +08:00
|
|
|
}
|
|
|
|
|
|
2009-05-16 05:02:12 +08:00
|
|
|
/**
|
|
|
|
|
* Retrieves the walker class given a walker name.
|
|
|
|
|
* @param walkerName Name of the walker.
|
|
|
|
|
* @return Class representing the walker.
|
|
|
|
|
*/
|
2009-03-27 21:27:04 +08:00
|
|
|
public Class getWalkerClassByName(String walkerName) {
|
2009-05-28 09:35:49 +08:00
|
|
|
return walkersByName.get(walkerName);
|
2009-03-18 07:22:37 +08:00
|
|
|
}
|
|
|
|
|
|
2009-05-16 05:02:12 +08:00
|
|
|
/**
|
|
|
|
|
* Gets the data source for the provided walker.
|
|
|
|
|
* @param walker The walker.
|
|
|
|
|
* @return Which type of data source to traverse over...reads or reference?
|
|
|
|
|
*/
|
|
|
|
|
public static DataSource getWalkerDataSource(Walker walker) {
|
|
|
|
|
Class<? extends Walker> walkerClass = walker.getClass();
|
|
|
|
|
By byDataSource = walkerClass.getAnnotation(By.class);
|
|
|
|
|
if( byDataSource == null )
|
|
|
|
|
throw new StingException("Unable to find By annotation for walker class " + walkerClass.getName());
|
|
|
|
|
return byDataSource.value();
|
|
|
|
|
}
|
|
|
|
|
|
2009-05-20 07:26:17 +08:00
|
|
|
/**
|
|
|
|
|
* Determine whether the given walker supports the given data source.
|
|
|
|
|
* @param walker Walker to query.
|
|
|
|
|
* @param dataSource Source to check for .
|
|
|
|
|
* @return True if the walker forbids this data type. False otherwise.
|
|
|
|
|
*/
|
|
|
|
|
public static boolean isAllowed(Walker walker, DataSource dataSource) {
|
|
|
|
|
Allows allowsDataSource = getWalkerAllowed(walker);
|
|
|
|
|
|
|
|
|
|
// Allows is less restrictive than requires. If an allows
|
|
|
|
|
// clause is not specified, any kind of data is allowed.
|
|
|
|
|
if( allowsDataSource == null )
|
|
|
|
|
return true;
|
|
|
|
|
|
|
|
|
|
return Arrays.asList(allowsDataSource.value()).contains(dataSource);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Determine whether the given walker supports the given reference ordered data.
|
|
|
|
|
* @param walker Walker to query.
|
|
|
|
|
* @param rod Source to check.
|
|
|
|
|
* @return True if the walker forbids this data type. False otherwise.
|
|
|
|
|
*/
|
|
|
|
|
public static boolean isAllowed(Walker walker, ReferenceOrderedData<? extends ReferenceOrderedDatum> rod) {
|
|
|
|
|
Allows allowsDataSource = getWalkerAllowed(walker);
|
|
|
|
|
|
|
|
|
|
// Allows is less restrictive than requires. If an allows
|
|
|
|
|
// clause is not specified, any kind of data is allowed.
|
|
|
|
|
if( allowsDataSource == null )
|
|
|
|
|
return true;
|
|
|
|
|
|
|
|
|
|
// The difference between unspecified RMD and the empty set of metadata can't be detected.
|
|
|
|
|
// Treat an empty 'allows' as 'allow everything'. Maybe we can have a special RMD flag to account for this
|
|
|
|
|
// case in the future.
|
|
|
|
|
if( allowsDataSource.referenceMetaData().length == 0 )
|
|
|
|
|
return true;
|
|
|
|
|
|
|
|
|
|
for( RMD allowed: allowsDataSource.referenceMetaData() ) {
|
|
|
|
|
if( rod.matches(allowed.name(),allowed.type()) )
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Determine whether the given walker requires the given data source.
|
|
|
|
|
* @param walker Walker to query.
|
|
|
|
|
* @param dataSource Source to check for.
|
|
|
|
|
* @return True if the walker allows this data type. False otherwise.
|
|
|
|
|
*/
|
|
|
|
|
public static boolean isRequired(Walker walker, DataSource dataSource) {
|
|
|
|
|
Requires requiresDataSource = getWalkerRequirements(walker);
|
|
|
|
|
return Arrays.asList(requiresDataSource.value()).contains(dataSource);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Get a list of RODs required by the walker.
|
|
|
|
|
* @param walker Walker to query.
|
|
|
|
|
* @return True if the walker allows this data type. False otherwise.
|
|
|
|
|
*/
|
|
|
|
|
public static List<RMD> getRequiredMetaData(Walker walker) {
|
|
|
|
|
Requires requiresDataSource = getWalkerRequirements(walker);
|
|
|
|
|
return Arrays.asList(requiresDataSource.referenceMetaData());
|
|
|
|
|
}
|
|
|
|
|
|
2009-07-10 07:59:53 +08:00
|
|
|
/**
|
|
|
|
|
* Extracts filters that the walker has requested be run on the dataset.
|
|
|
|
|
* @param walker Walker to inspect for filtering requests.
|
|
|
|
|
* @return A non-empty list of filters to apply to the reads.
|
|
|
|
|
*/
|
|
|
|
|
public static List<SamRecordFilter> getReadFilters(Walker walker) {
|
|
|
|
|
Class<? extends SamRecordFilter>[] filterTypes = getReadFilterTypes(walker);
|
|
|
|
|
List<SamRecordFilter> filters = new ArrayList<SamRecordFilter>();
|
|
|
|
|
|
|
|
|
|
for( Class<? extends SamRecordFilter> filterType: filterTypes ) {
|
|
|
|
|
try {
|
|
|
|
|
filters.add(filterType.newInstance());
|
|
|
|
|
}
|
|
|
|
|
catch( InstantiationException ex ) {
|
|
|
|
|
throw new StingException("Unable to instantiate filter: " + filterType, ex);
|
|
|
|
|
}
|
|
|
|
|
catch( IllegalAccessException ex ) {
|
|
|
|
|
throw new StingException("Unable to access filter: " + filterType, ex);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return filters;
|
|
|
|
|
}
|
|
|
|
|
|
2009-03-18 07:22:37 +08:00
|
|
|
/**
|
|
|
|
|
* Instantiate the list of walker classes. Add them to the walker hashmap.
|
2009-03-27 21:27:04 +08:00
|
|
|
*
|
2009-03-18 07:22:37 +08:00
|
|
|
* @param walkerClasses Classes to instantiate.
|
2009-03-27 04:45:27 +08:00
|
|
|
* @return map of walker name to walker.
|
2009-03-18 07:22:37 +08:00
|
|
|
*/
|
2009-05-28 09:35:49 +08:00
|
|
|
private Map<String, Class<? extends Walker>> createWalkerDatabase(List<Class<? extends Walker>> walkerClasses) {
|
|
|
|
|
Map<String, Class<? extends Walker>> walkers = new HashMap<String, Class<? extends Walker>>();
|
2009-03-18 07:22:37 +08:00
|
|
|
|
2009-05-28 09:35:49 +08:00
|
|
|
for (Class<? extends Walker> walkerClass : walkerClasses) {
|
2009-03-27 21:27:04 +08:00
|
|
|
String walkerName = getWalkerName(walkerClass);
|
2009-03-27 21:44:46 +08:00
|
|
|
logger.info(String.format("* Adding module %s", walkerName));
|
2009-03-27 21:27:04 +08:00
|
|
|
walkers.put(walkerName, walkerClass);
|
2009-03-18 07:22:37 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return walkers;
|
|
|
|
|
}
|
2009-03-27 04:45:27 +08:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Create a name for this type of walker.
|
2009-03-27 21:27:04 +08:00
|
|
|
*
|
2009-03-27 04:45:27 +08:00
|
|
|
* @param walkerType The type of walker.
|
|
|
|
|
* @return A name for this type of walker.
|
|
|
|
|
*/
|
2009-05-20 07:26:17 +08:00
|
|
|
public static String getWalkerName(Class<? extends Walker> walkerType) {
|
2009-03-27 04:45:27 +08:00
|
|
|
String walkerName = "";
|
|
|
|
|
|
2009-03-27 21:27:04 +08:00
|
|
|
if (walkerType.getAnnotation(WalkerName.class) != null)
|
|
|
|
|
walkerName = walkerType.getAnnotation(WalkerName.class).value().trim();
|
2009-03-27 04:45:27 +08:00
|
|
|
|
2009-03-27 21:27:04 +08:00
|
|
|
if (walkerName.length() == 0) {
|
2009-03-27 04:45:27 +08:00
|
|
|
walkerName = walkerType.getSimpleName();
|
2009-03-27 21:27:04 +08:00
|
|
|
if (walkerName.endsWith("Walker"))
|
|
|
|
|
walkerName = walkerName.substring(0, walkerName.lastIndexOf("Walker"));
|
2009-03-27 04:45:27 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return walkerName;
|
|
|
|
|
}
|
2009-05-20 07:26:17 +08:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Utility to get the requires attribute from the walker.
|
|
|
|
|
* Throws an exception if requirements are missing.
|
|
|
|
|
* @param walker Walker to query for required data.
|
|
|
|
|
* @return Required data attribute.
|
|
|
|
|
*/
|
|
|
|
|
private static Requires getWalkerRequirements(Walker walker) {
|
|
|
|
|
Class<? extends Walker> walkerClass = walker.getClass();
|
|
|
|
|
Requires requiresDataSource = walkerClass.getAnnotation(Requires.class);
|
|
|
|
|
if( requiresDataSource == null )
|
|
|
|
|
throw new StingException( "Unable to find data types required by walker class " + walkerClass.getName());
|
|
|
|
|
return requiresDataSource;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Utility to get the forbidden attribute from the walker.
|
|
|
|
|
* @param walker Walker to query for required data.
|
|
|
|
|
* @return Required data attribute. Null if forbidden info isn't present.
|
|
|
|
|
*/
|
|
|
|
|
private static Allows getWalkerAllowed(Walker walker) {
|
|
|
|
|
Class<? extends Walker> walkerClass = walker.getClass();
|
|
|
|
|
Allows allowsDataSource = walkerClass.getAnnotation(Allows.class);
|
|
|
|
|
return allowsDataSource;
|
|
|
|
|
}
|
2009-07-10 07:59:53 +08:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Gets the list of filtering classes specified as walker annotations.
|
|
|
|
|
* @param walker The walker to inspect.
|
|
|
|
|
* @return An array of types extending from SamRecordFilter. Will never be null.
|
|
|
|
|
*/
|
|
|
|
|
private static Class<? extends SamRecordFilter>[] getReadFilterTypes(Walker walker) {
|
|
|
|
|
Class<? extends Walker> walkerClass = walker.getClass();
|
|
|
|
|
if( !walkerClass.isAnnotationPresent(ReadFilters.class) )
|
|
|
|
|
return new Class[0];
|
|
|
|
|
return walkerClass.getAnnotation(ReadFilters.class).value();
|
|
|
|
|
}
|
2009-03-18 07:22:37 +08:00
|
|
|
}
|