/* * Eoulsan development code * * This code may be freely distributed and modified under the * terms of the GNU Lesser General Public License version 2.1 or * later and CeCILL-C. This should be distributed with the code. * If you do not have a copy, see: * * http://www.gnu.org/licenses/lgpl-2.1.txt * http://www.cecill.info/licences/Licence_CeCILL-C_V1-en.txt * * Copyright for this code is held jointly by the Genomic platform * of the Institut de Biologie de l'École normale supérieure and * the individual authors. These should be listed in @author doc * comments. * * For more information on the Eoulsan project and its aims, * or to join the Eoulsan Google group, visit the home page * at: * * http://outils.genomique.biologie.ens.fr/eoulsan * */ package fr.ens.biologie.genomique.eoulsan.bio.alignmentsfilters; import static org.junit.Assert.assertEquals; import htsjdk.samtools.SAMLineParser; import htsjdk.samtools.SAMRecord; import java.util.ArrayList; import java.util.List; import org.junit.Before; import org.junit.Test; import fr.ens.biologie.genomique.eoulsan.bio.GenomeDescription; import fr.ens.biologie.genomique.eoulsan.bio.SAMUtils; import fr.ens.biologie.genomique.eoulsan.bio.alignmentsfilters.RemoveMultiMatchesReadAlignmentsFilter; /** * This class is a JUnit test class to test the class * RemoveMultiMatchesReadAlignments.java. * @author Claire Wallon */ public class RemoveMultiMatchesReadAlignmentsFilterTest { private String recordSE1, recordSE2; private String recordPE1, recordPE2, recordPE3, recordPE4; private SAMRecord samRecordSE1, samRecordSE2; private SAMRecord samRecordPE1, samRecordPE2, samRecordPE3, samRecordPE4; private RemoveMultiMatchesReadAlignmentsFilter filter; /** * @throws java.lang.Exception */ @Before public void setUp() throws Exception { // recordSE1 and recordSE2 have the same read name (two matches for the // same read) this.recordSE1 = "HWI-EAS285_0001_'':1:1:1259:2442#0/1\t16\tchr9\t59513044\t25\t76M\t*\t0\t0" + "\tGGGACTGCCTTCANNNAGANNCAGNANCTCCNNNNNNNNNNNNNNGACACCTTCCTGNAACACATGTGCCGCCTGG" + "\t#############################################ABE@?E@>CC@C#BBDEDGGGGFFEGEGGGG" + "\tXA:i:1\tMD:Z:13T0T0C3C0C3C1G4A0T0G0C0A0G0C0C0A0T0G0G0C0T12G18\tNM:i:22"; this.recordSE2 = "HWI-EAS285_0001_'':1:1:1259:2442#0/1\t0\tchr5\t22231887\t55\t76M\t*\t0\t0" + "\tCCAGGCGGCACATGTGTTNCAGGAAGGTGTCNNNNNNNNNNNNNNGGAGNTNCTGNNTCTNNNTGAAGGCAGTCCC" + "\tGGGGEGEFFGGGGDEDBB#C@CC>@E?@EBA#############################################\t" + "XA:i:1\tMD:Z:18C12A0G0C0C0A0T0G0G0C0T0G0C0A0T4C1G3G0G3G0A0A13\tNM:i:22"; // recordPE1, recordPE2, recordPE3 and recordPE4 have the same read name // (two matches for the same read) // recordPE1 and recordPE2 paired this.recordPE1 = "HWI-1KL110:37:C0BE6ACXX:7:1101:2584:2222\t99\tchr1\t173235257\t255\t101M\t=\t173235280\t124" + "\tCTTGTATCGCTCCTCAAACTTGACCTTGGCCTCCCGCCTGGCCTTGCGCTTCAAAGCTGGGTCCCTGAACACATCCTTGTTGACAACAGTCTTGTCCAAGG" + "\tCCCFFFFFHHHHHJJJJJJJJJJJJJJJJJJJJJJJJJHIIJIJJIIIIJJJJJIIJHHHHFFFFFDEEEEDDDDDDDDDDDDDDDDDDDDDEDDDDDDDD" + "\tXA:i:0\tMD:Z:101\tNM:i:0"; this.recordPE2 = "HWI-1KL110:37:C0BE6ACXX:7:1101:2584:2222\t147\tchr1\t173235280\t255\t101M\t=\t173235257\t-124" + "\tCCTTGGCCTCCCGCCTGGCCTTGCGCTTCAAAGCTGGGTCCCTGAACACATCCTTGTTGACAACAGTCTTGTCCAAGGGGATATCCACAGAGTACCTTGTG" + "\tDDDDDDDDDDDDDDDDDDDDDDDFFHHHHHHJJJJJJJJJHDJJJJJIJIHIJJJJJIIIJJJIJJIJJJJJHJJJJJJJJJJJJJJJHHHHHDFFFFCCC" + "\tXA:i:0\tMD:Z:101\tNM:i:0"; // recordPE3 and recordPE4 paired this.recordPE3 = "HWI-1KL110:37:C0BE6ACXX:7:1101:2584:2222\t99\tchr11\t93898574\t255\t101M\t=\t93898597\t124" + "\tCTTGTATCGCTCCTCAAACTTGACCTTGGCCTCCCGCCTGGCCTTGCGCTTCAAAGCTGGGTCCCTGAACACATCCTTGTTGACAACAGTCTTGTCCAAGG" + "\tCCCFFFFFHHHHHJJJJJJJJJJJJJJJJJJJJJJJJJHIIJIJJIIIIJJJJJIIJHHHHFFFFFDEEEEDDDDDDDDDDDDDDDDDDDDDEDDDDDDDD" + "\tXA:i:0\tMD:Z:101\tNM:i:0"; this.recordPE4 = "HWI-1KL110:37:C0BE6ACXX:7:1101:2584:2222\t147\tchr11\t93898597\t255\t101M\t=\t93898574\t-124" + "\tCCTTGGCCTCCCGCCTGGCCTTGCGCTTCAAAGCTGGGTCCCTGAACACATCCTTGTTGACAACAGTCTTGTCCAAGGGGATATCCACAGAGTACCTTGTG" + "\tDDDDDDDDDDDDDDDDDDDDDDDFFHHHHHHJJJJJJJJJHDJJJJJIJIHIJJJJJIIIJJJIJJIJJJJJHJJJJJJJJJJJJJJJHHHHHDFFFFCCC" + "\tXA:i:0\tMD:Z:101\tNM:i:0"; final GenomeDescription desc = new GenomeDescription(); desc.addSequence("chr1", 197195432); desc.addSequence("chr5", 152537259); desc.addSequence("chr9", 124076172); desc.addSequence("chr11", 121843856); SAMLineParser parser = new SAMLineParser(SAMUtils.newSAMFileHeader(desc)); this.samRecordSE1 = parser.parseLine(this.recordSE1); this.samRecordSE2 = parser.parseLine(this.recordSE2); this.samRecordPE1 = parser.parseLine(this.recordPE1); this.samRecordPE2 = parser.parseLine(this.recordPE2); this.samRecordPE3 = parser.parseLine(this.recordPE3); this.samRecordPE4 = parser.parseLine(this.recordPE4); this.filter = new RemoveMultiMatchesReadAlignmentsFilter(); } /** * Test method for {fr.ens.biologie.genomique.eoulsan.bio.alignmentsfilters. * RemoveMultiMatchesReadAlignmentsFilter#getName()}. */ @Test public void testGetName() { assertEquals("removemultimatches", this.filter.getName()); } /** * Test method for {fr.ens.biologie.genomique.eoulsan.bio.alignmentsfilters. * RemoveMultiMatchesReadAlignmentsFilter#getDescription()}. */ @Test public void testGetDescription() { assertEquals("Remove all the alignments with several matches", this.filter.getDescription()); } /** * Test method for {fr.ens.biologie.genomique.eoulsan.bio.alignmentsfilters. * RemoveMultiMatchesReadAlignmentsFilter#filterReadAlignments(java.util.List, * boolean)}. */ @Test public void testFilterReadAlignments() { final List<SAMRecord> records = new ArrayList<>(); final List<SAMRecord> recordsCheck = new ArrayList<>(); // single-end mode records.add(this.samRecordSE1); recordsCheck.add(this.samRecordSE1); this.filter.filterReadAlignments(records); assertEquals(records, recordsCheck); records.add(this.samRecordSE2); recordsCheck.clear(); this.filter.filterReadAlignments(records); assertEquals(records, recordsCheck); records.clear(); recordsCheck.clear(); // paired-end mode records.add(this.samRecordPE1); records.add(this.samRecordPE2); recordsCheck.add(this.samRecordPE1); recordsCheck.add(this.samRecordPE2); this.filter.filterReadAlignments(records); assertEquals(records, recordsCheck); records.add(this.samRecordPE3); records.add(this.samRecordPE4); recordsCheck.clear(); this.filter.filterReadAlignments(records); assertEquals(records, recordsCheck); records.clear(); records.add(this.samRecordPE1); assertEquals(1, records.size()); records.clear(); records.add(this.samRecordPE1); records.add(this.samRecordPE1); this.filter.filterReadAlignments(records); assertEquals(0, records.size()); records.clear(); records.add(this.samRecordPE2); assertEquals(1, records.size()); records.clear(); records.add(this.samRecordPE2); records.add(this.samRecordPE2); this.filter.filterReadAlignments(records); assertEquals(0, records.size()); records.clear(); records.add(this.samRecordPE1); records.add(this.samRecordPE2); records.add(this.samRecordPE2); this.filter.filterReadAlignments(records); assertEquals(0, records.size()); records.clear(); records.add(this.samRecordPE1); records.add(this.samRecordPE1); records.add(this.samRecordPE2); records.add(this.samRecordPE2); this.filter.filterReadAlignments(records); assertEquals(0, records.size()); records.clear(); records.add(this.samRecordPE1); records.add(this.samRecordPE2); this.filter.filterReadAlignments(records); assertEquals(2, records.size()); records.clear(); this.filter.filterReadAlignments(records); assertEquals(0, records.size()); } }