/* * Copyright [1999-2015] Wellcome Trust Sanger Institute and the EMBL-European Bioinformatics Institute * Copyright [2016-2017] EMBL-European Bioinformatics Institute * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.ensembl.healthcheck.testcase.generic; import java.sql.Connection; import org.ensembl.healthcheck.DatabaseRegistryEntry; import org.ensembl.healthcheck.DatabaseType; import org.ensembl.healthcheck.ReportManager; import org.ensembl.healthcheck.Team; import org.ensembl.healthcheck.testcase.SingleDatabaseTestCase; import org.ensembl.healthcheck.util.DBUtils; /** * Check that there are no duplicates in the assembly table. */ public class DuplicateAssembly extends SingleDatabaseTestCase { /** * Create a new DuplicateAssembly testcase. */ public DuplicateAssembly() { setDescription("Check that there are no duplicates in the assembly table"); setTeamResponsible(Team.GENEBUILD); } /** * Data is only tested in core database, as the tables are in sync */ public void types() { removeAppliesToType(DatabaseType.OTHERFEATURES); removeAppliesToType(DatabaseType.ESTGENE); removeAppliesToType(DatabaseType.RNASEQ); removeAppliesToType(DatabaseType.CDNA); } /** * Run the test. * * @param dbre * The database to use. * @return true if the test passed. * */ public boolean run(DatabaseRegistryEntry dbre) { boolean result = true; Connection con = dbre.getConnection(); int rows = DBUtils.getRowCount(con, "SELECT *, COUNT(*) AS c FROM assembly GROUP BY asm_seq_region_id, cmp_seq_region_id, asm_start, asm_end, cmp_start, cmp_end, ori HAVING c > 1"); if (rows > 0) { ReportManager.problem(this, con, "At least " + rows + " duplicate rows in assembly table"); result = false; } else { ReportManager.correct(this, con, "No duplicate rows in the assembly table"); } return result; } // run /** * Note more details can be obtained via: * * SELECT a.*, sr1.name, cs1.name, sr2.name, cs2.name, COUNT(*) AS c FROM assembly a, seq_region sr1, seq_region sr2, coord_system * cs1, coord_system cs2 WHERE a.cmp_seq_region_id = sr1.seq_region_id AND sr1.coord_system_id = cs1.coord_system_id AND * a.asm_seq_region_id = sr2.seq_region_id AND sr2.coord_system_id = cs2.coord_system_id GROUP BY asm_seq_region_id, * cmp_seq_region_id, asm_start, asm_end, cmp_start, cmp_end, ori HAVING c > 1; */ } // DuplicateAssembly